morriszms committed · verified · commit bec92b9 · 1 parent: 4f29675

Upload folder using huggingface_hub
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+ falcon-mamba-7b-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,172 @@
+ ---
+ language:
+ - en
+ datasets:
+ - tiiuae/falcon-refinedweb
+ - HuggingFaceFW/fineweb-edu
+ license: other
+ license_name: falcon-mamba-7b-license
+ license_link: https://falconllm.tii.ae/falcon-mamba-7b-terms-and-conditions.html
+ base_model: tiiuae/falcon-mamba-7b
+ tags:
+ - TensorBlock
+ - GGUF
+ model-index:
+ - name: falcon-mamba-7b
+   results:
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: IFEval (0-Shot)
+       type: HuggingFaceH4/ifeval
+       args:
+         num_few_shot: 0
+     metrics:
+     - type: inst_level_strict_acc and prompt_level_strict_acc
+       value: 33.36
+       name: strict accuracy
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: BBH (3-Shot)
+       type: BBH
+       args:
+         num_few_shot: 3
+     metrics:
+     - type: acc_norm
+       value: 19.88
+       name: normalized accuracy
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: MATH Lvl 5 (4-Shot)
+       type: hendrycks/competition_math
+       args:
+         num_few_shot: 4
+     metrics:
+     - type: exact_match
+       value: 3.63
+       name: exact match
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: GPQA (0-shot)
+       type: Idavidrein/gpqa
+       args:
+         num_few_shot: 0
+     metrics:
+     - type: acc_norm
+       value: 8.05
+       name: acc_norm
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: MuSR (0-shot)
+       type: TAUR-Lab/MuSR
+       args:
+         num_few_shot: 0
+     metrics:
+     - type: acc_norm
+       value: 10.86
+       name: acc_norm
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+   - task:
+       type: text-generation
+       name: Text Generation
+     dataset:
+       name: MMLU-PRO (5-shot)
+       type: TIGER-Lab/MMLU-Pro
+       config: main
+       split: test
+       args:
+         num_few_shot: 5
+     metrics:
+     - type: acc
+       value: 14.47
+       name: accuracy
+     source:
+       url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=tiiuae/falcon-mamba-7b
+       name: Open LLM Leaderboard
+ ---
+ 
+ <div style="width: auto; margin-left: auto; margin-right: auto">
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
+ </div>
+ <div style="display: flex; justify-content: space-between; width: 100%;">
+   <div style="display: flex; flex-direction: column; align-items: flex-start;">
+     <p style="margin-top: 0.5em; margin-bottom: 0em;">
+       Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
+     </p>
+   </div>
+ </div>
+ 
+ ## tiiuae/falcon-mamba-7b - GGUF
+ 
+ This repo contains GGUF format model files for [tiiuae/falcon-mamba-7b](https://huggingface.co/tiiuae/falcon-mamba-7b).
+ 
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4011](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
+ 
+ ## Prompt template
+ 
+ No chat template is defined for this model (it is a base, non-instruct model), so prompts are passed as plain text:
+ 
+ ```
+ 
+ ```
+ 
+ ## Model file specification
+ 
+ | Filename | Quant type | File Size | Description |
+ | -------- | ---------- | --------- | ----------- |
+ | [falcon-mamba-7b-Q2_K.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q2_K.gguf) | Q2_K | 2.389 GB | smallest, significant quality loss - not recommended for most purposes |
+ | [falcon-mamba-7b-Q3_K_S.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q3_K_S.gguf) | Q3_K_S | 3.050 GB | very small, high quality loss |
+ | [falcon-mamba-7b-Q3_K_M.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q3_K_M.gguf) | Q3_K_M | 3.050 GB | very small, high quality loss |
+ | [falcon-mamba-7b-Q3_K_L.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q3_K_L.gguf) | Q3_K_L | 3.050 GB | small, substantial quality loss |
+ | [falcon-mamba-7b-Q4_0.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q4_0.gguf) | Q4_0 | 3.915 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
+ | [falcon-mamba-7b-Q4_K_S.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q4_K_S.gguf) | Q4_K_S | 3.915 GB | small, greater quality loss |
+ | [falcon-mamba-7b-Q4_K_M.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q4_K_M.gguf) | Q4_K_M | 3.915 GB | medium, balanced quality - recommended |
+ | [falcon-mamba-7b-Q5_0.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q5_0.gguf) | Q5_0 | 4.730 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
+ | [falcon-mamba-7b-Q5_K_S.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q5_K_S.gguf) | Q5_K_S | 4.730 GB | large, low quality loss - recommended |
+ | [falcon-mamba-7b-Q5_K_M.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q5_K_M.gguf) | Q5_K_M | 4.730 GB | large, very low quality loss - recommended |
+ | [falcon-mamba-7b-Q6_K.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q6_K.gguf) | Q6_K | 5.595 GB | very large, extremely low quality loss |
+ | [falcon-mamba-7b-Q8_0.gguf](https://huggingface.co/tensorblock/falcon-mamba-7b-GGUF/tree/main/falcon-mamba-7b-Q8_0.gguf) | Q8_0 | 7.232 GB | very large, extremely low quality loss - not recommended |
+ 
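The file sizes above can be converted into an approximate bits-per-weight figure, which is the usual way to compare quant types. A minimal sketch, assuming falcon-mamba-7b has roughly 7.27 billion parameters (an assumed approximate count, not stated in this card), using sizes taken from the LFS pointers in this commit:

```python
# Estimate average bits stored per model weight from a GGUF file size.
# NUM_PARAMS is an ASSUMED approximate parameter count for falcon-mamba-7b.
NUM_PARAMS = 7.27e9

def bits_per_weight(file_size_bytes: float, num_params: float = NUM_PARAMS) -> float:
    """Rough whole-file average; includes GGUF metadata and scale overhead."""
    return file_size_bytes * 8 / num_params

# Byte sizes from this commit's LFS pointer files:
sizes = {
    "Q2_K": 2565011200,
    "Q4_K_M": 4204230400,
    "Q8_0": 7765735168,
}
for quant, size in sizes.items():
    print(f"{quant}: ~{bits_per_weight(size):.2f} bits/weight")
```

The result is only a whole-file average: actual precision varies per tensor within a quant type, which is why, for example, Q8_0 comes out slightly above 8 bits.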
+ ## Downloading instructions
+ 
+ ### Command line
+ 
+ First, install the Hugging Face CLI:
+ 
+ ```shell
+ pip install -U "huggingface_hub[cli]"
+ ```
+ 
+ Then download an individual model file to a local directory:
+ 
+ ```shell
+ huggingface-cli download tensorblock/falcon-mamba-7b-GGUF --include "falcon-mamba-7b-Q2_K.gguf" --local-dir MY_LOCAL_DIR
+ ```
+ 
+ To download multiple model files matching a pattern (e.g., `*Q4_K*gguf`):
+ 
+ ```shell
+ huggingface-cli download tensorblock/falcon-mamba-7b-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
+ ```
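The `--include` pattern is a shell-style glob. The same selection can be reproduced in Python with `fnmatch`, and `huggingface_hub.hf_hub_download` can then fetch the matched files; in this sketch the download call is left commented out so it runs offline, and the file list is copied from the table above:

```python
from fnmatch import fnmatch

# File list as published in this repo's model file specification table.
repo_files = [
    "falcon-mamba-7b-Q2_K.gguf", "falcon-mamba-7b-Q3_K_S.gguf",
    "falcon-mamba-7b-Q3_K_M.gguf", "falcon-mamba-7b-Q3_K_L.gguf",
    "falcon-mamba-7b-Q4_0.gguf", "falcon-mamba-7b-Q4_K_S.gguf",
    "falcon-mamba-7b-Q4_K_M.gguf", "falcon-mamba-7b-Q5_0.gguf",
    "falcon-mamba-7b-Q5_K_S.gguf", "falcon-mamba-7b-Q5_K_M.gguf",
    "falcon-mamba-7b-Q6_K.gguf", "falcon-mamba-7b-Q8_0.gguf",
]

def select(pattern: str) -> list[str]:
    """Mimic the CLI's --include glob filtering."""
    return [f for f in repo_files if fnmatch(f, pattern)]

matched = select("*Q4_K*gguf")
print(matched)  # the two Q4_K variants

# To actually download (requires network; uncomment to use):
# from huggingface_hub import hf_hub_download
# for f in matched:
#     hf_hub_download(repo_id="tensorblock/falcon-mamba-7b-GGUF",
#                     filename=f, local_dir="MY_LOCAL_DIR")
```

Note that `*Q4_K*gguf` deliberately excludes `Q4_0`, since the legacy quant has no `_K` in its name.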
falcon-mamba-7b-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f8325c406eda952b24c46d08c792b755486c2e1e3d7809398e34e1aabe0f4635
+ size 2565011200
falcon-mamba-7b-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:cfb9598415e196bd3f7a007a566ecda6a6c21423fb3947f05ed5fe48eb723044
+ size 3275339520
falcon-mamba-7b-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:611ddf623476068e97afadd9faa6a7030f065464d70d19746f62b5f6c61ca169
+ size 3275339520
falcon-mamba-7b-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1566471de457162ef3c9c379fb91bfc3a5880b4a41831741f16f8dabeaed6c4e
+ size 3275339520
falcon-mamba-7b-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:88e6c41a1eb366f1405da691d41283b43b6c99b0507f750bf8a443fd24d7d1c1
+ size 4204230400
falcon-mamba-7b-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:eaa31dbf8058c867844df9a47f1a4834dfc413e5f9d0ce10d710904668bede7f
+ size 4204230400
falcon-mamba-7b-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f3b4c9fd92701725cb511bd5b6a94a38e0e03baeae51c1212ee8254ea44b6880
+ size 4204230400
falcon-mamba-7b-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f70d60c9b92cf1e78f5aa31fdded73992461724d17470e5f2bf67b8a81ff2996
+ size 5078480640
falcon-mamba-7b-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c032f66d7c42362872b8e69789d7f8d15f89b46f1b22097bb125f7e2af5edc67
+ size 5078480640
falcon-mamba-7b-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b991276af7a5a799b17b39593373afaa75b27b685423321a87ac7459b5618d45
+ size 5078480640
falcon-mamba-7b-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e7a14c58e487988aadaa1c1d078b1d41327ba89c3a3e3d54f890af65cfc8898f
+ size 6007371520
falcon-mamba-7b-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e2415f0eab5cc36d3a1c930e8235448311376c18e344bda5893f78059c80f1dc
+ size 7765735168
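Each `.gguf` entry above is a Git LFS pointer that records the file's SHA-256, so a completed download can be verified locally. A minimal sketch using `sha256sum` (the file path is a placeholder for wherever you saved the model; the expected hash is the Q2_K value from this commit's pointer file):

```shell
# Verify a downloaded GGUF against the sha256 recorded in its LFS pointer.
EXPECTED=f8325c406eda952b24c46d08c792b755486c2e1e3d7809398e34e1aabe0f4635
FILE=MY_LOCAL_DIR/falcon-mamba-7b-Q2_K.gguf   # placeholder path

ACTUAL=$(sha256sum "$FILE" | cut -d' ' -f1)
if [ "$ACTUAL" = "$EXPECTED" ]; then
    echo "checksum OK"
else
    echo "checksum MISMATCH" >&2
fi
```

On macOS, `shasum -a 256` can stand in for `sha256sum`.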