NeoChen1024
committed on
Upload folder using huggingface_hub
Browse files
- config.json +2 -2
- generation_config.json +1 -1
- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +1 -1
- recipe.yaml +1 -0
- tokenizer.json +2 -2
config.json
CHANGED
@@ -58,7 +58,7 @@
|
|
58 |
}
|
59 |
},
|
60 |
"format": "int-quantized",
|
61 |
-
"global_compression_ratio": 1.
|
62 |
"ignore": [
|
63 |
"lm_head"
|
64 |
],
|
@@ -77,7 +77,7 @@
|
|
77 |
"rope_theta": 500000.0,
|
78 |
"tie_word_embeddings": false,
|
79 |
"torch_dtype": "bfloat16",
|
80 |
-
"transformers_version": "4.
|
81 |
"use_cache": false,
|
82 |
"vocab_size": 128258
|
83 |
}
|
|
|
58 |
}
|
59 |
},
|
60 |
"format": "int-quantized",
|
61 |
+
"global_compression_ratio": 1.5282327198317063,
|
62 |
"ignore": [
|
63 |
"lm_head"
|
64 |
],
|
|
|
77 |
"rope_theta": 500000.0,
|
78 |
"tie_word_embeddings": false,
|
79 |
"torch_dtype": "bfloat16",
|
80 |
+
"transformers_version": "4.48.0",
|
81 |
"use_cache": false,
|
82 |
"vocab_size": 128258
|
83 |
}
|
generation_config.json
CHANGED
@@ -10,5 +10,5 @@
|
|
10 |
],
|
11 |
"temperature": 0.6,
|
12 |
"top_p": 0.9,
|
13 |
-
"transformers_version": "4.
|
14 |
}
|
|
|
10 |
],
|
11 |
"temperature": 0.6,
|
12 |
"top_p": 0.9,
|
13 |
+
"transformers_version": "4.48.0"
|
14 |
}
|
model-00001-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999417248
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f513eec475d256a7f56228ad4982b406b156e04a5a5a78a6b2fa1c954d30ef1f
|
3 |
size 4999417248
|
model-00002-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4084628880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7267604493236610ecb144e2b256f887388b1e5980c93a32d03019e276dad2b
|
3 |
size 4084628880
|
recipe.yaml
CHANGED
@@ -3,5 +3,6 @@ DEFAULT_stage:
|
|
3 |
SmoothQuantModifier: {smoothing_strength: 0.8}
|
4 |
GPTQModifier:
|
5 |
targets: Linear
|
|
|
6 |
ignore: [lm_head]
|
7 |
scheme: W8A8
|
|
|
3 |
SmoothQuantModifier: {smoothing_strength: 0.8}
|
4 |
GPTQModifier:
|
5 |
targets: Linear
|
6 |
+
dampening_frac: 0.1
|
7 |
ignore: [lm_head]
|
8 |
scheme: W8A8
|
tokenizer.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe64d8928b8843143ff63a86ef01beafd2943e72090bb5f9800db4a97f5c7e5f
|
3 |
+
size 17210579
|