NeoChen1024 committed on
Commit
34b8679
·
verified ·
1 Parent(s): c4a6538

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -58,7 +58,7 @@
58
  }
59
  },
60
  "format": "int-quantized",
61
- "global_compression_ratio": 1.458959021662211,
62
  "ignore": [
63
  "lm_head"
64
  ],
@@ -77,7 +77,7 @@
77
  "rope_theta": 500000.0,
78
  "tie_word_embeddings": false,
79
  "torch_dtype": "bfloat16",
80
- "transformers_version": "4.47.1",
81
  "use_cache": false,
82
  "vocab_size": 128258
83
  }
 
58
  }
59
  },
60
  "format": "int-quantized",
61
+ "global_compression_ratio": 1.5282327198317063,
62
  "ignore": [
63
  "lm_head"
64
  ],
 
77
  "rope_theta": 500000.0,
78
  "tie_word_embeddings": false,
79
  "torch_dtype": "bfloat16",
80
+ "transformers_version": "4.48.0",
81
  "use_cache": false,
82
  "vocab_size": 128258
83
  }
generation_config.json CHANGED
@@ -10,5 +10,5 @@
10
  ],
11
  "temperature": 0.6,
12
  "top_p": 0.9,
13
- "transformers_version": "4.47.1"
14
  }
 
10
  ],
11
  "temperature": 0.6,
12
  "top_p": 0.9,
13
+ "transformers_version": "4.48.0"
14
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a72689e38e01904d861bde6b93babad602483c34a197d2e1014d9ec172833f3e
3
  size 4999417248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f513eec475d256a7f56228ad4982b406b156e04a5a5a78a6b2fa1c954d30ef1f
3
  size 4999417248
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baf71f14e5867c0382e0efc7cbf5618c0625c892d276deb97c0a670b65a9d2a7
3
  size 4084628880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7267604493236610ecb144e2b256f887388b1e5980c93a32d03019e276dad2b
3
  size 4084628880
recipe.yaml CHANGED
@@ -3,5 +3,6 @@ DEFAULT_stage:
3
  SmoothQuantModifier: {smoothing_strength: 0.8}
4
  GPTQModifier:
5
  targets: Linear
 
6
  ignore: [lm_head]
7
  scheme: W8A8
 
3
  SmoothQuantModifier: {smoothing_strength: 0.8}
4
  GPTQModifier:
5
  targets: Linear
6
+ dampening_frac: 0.1
7
  ignore: [lm_head]
8
  scheme: W8A8
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cca43616769fed4807470fb41ccf7f5eebdd08624e7b9adafc09d99332cf31eb
3
- size 17210297
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe64d8928b8843143ff63a86ef01beafd2943e72090bb5f9800db4a97f5c7e5f
3
+ size 17210579