DavidGF committed on
Commit
fb4ea92
1 Parent(s): a32a34e

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/root/.cache/huggingface/hub/models--VAGOsolutions--SauerkrautLM-gemma-2-9b-it/snapshots/8e02fc1c24e0499c74ee1186ddc46b989fe497f1",
3
  "architectures": [
4
  "Gemma2ForCausalLM"
5
  ],
@@ -23,8 +23,13 @@
23
  "num_key_value_heads": 8,
24
  "pad_token_id": 0,
25
  "quantization_config": {
 
26
  "bits": 4,
 
 
 
27
  "group_size": 128,
 
28
  "modules_to_not_convert": null,
29
  "quant_method": "awq",
30
  "version": "gemm",
@@ -35,7 +40,7 @@
35
  "rope_theta": 10000.0,
36
  "sliding_window": 4096,
37
  "sliding_window_size": 4096,
38
- "torch_dtype": "float16",
39
  "transformers_version": "4.45.2",
40
  "use_cache": false,
41
  "vocab_size": 256000
 
1
  {
2
+ "_name_or_path": "VAGOsolutions/SauerkrautLM-gemma-2-9b-it",
3
  "architectures": [
4
  "Gemma2ForCausalLM"
5
  ],
 
23
  "num_key_value_heads": 8,
24
  "pad_token_id": 0,
25
  "quantization_config": {
26
+ "backend": "autoawq",
27
  "bits": 4,
28
+ "do_fuse": false,
29
+ "exllama_config": null,
30
+ "fuse_max_seq_len": null,
31
  "group_size": 128,
32
+ "modules_to_fuse": null,
33
  "modules_to_not_convert": null,
34
  "quant_method": "awq",
35
  "version": "gemm",
 
40
  "rope_theta": 10000.0,
41
  "sliding_window": 4096,
42
  "sliding_window_size": 4096,
43
+ "torch_dtype": "bfloat16",
44
  "transformers_version": "4.45.2",
45
  "use_cache": false,
46
  "vocab_size": 256000
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecc01efa16360296837df01926e3249b5422064fea3d99fa1b347f7a99cec0e6
3
- size 6835062392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e38734fa8550c5e4600ef3303479da9215b821ddbe962c476b14b0496214cf
3
+ size 5000054416
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6baeb948526c1f7f7670d1b117d980d383530a32e248d49167c6ad944c517a1c
3
- size 1160653528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f500a8489f8d147e97d10068bcefe245e1d60637b5269ae1ee101a350c19cddc
3
+ size 1160653576
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff