CharlieFRuan
committed on
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +41 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 5120,
|
6 |
+
"intermediate_size": 13824,
|
7 |
+
"num_attention_heads": 40,
|
8 |
+
"num_hidden_layers": 40,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32016,
|
11 |
+
"position_embedding_base": 1000000,
|
12 |
+
"context_window_size": 16384,
|
13 |
+
"prefill_chunk_size": 16384,
|
14 |
+
"num_key_value_heads": 40,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 32016,
|
20 |
+
"context_window_size": 16384,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 16384,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.95,
|
31 |
+
"conv_template": "LM",
|
32 |
+
"pad_token_id": 0,
|
33 |
+
"bos_token_id": 1,
|
34 |
+
"eos_token_id": 2,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.model",
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"version": "0.1.0"
|
41 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7de43e395a7ecf868d21f686a1387e9e57b68666f4785b440cb49436756666c9
|
3 |
+
size 81960960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:754101f9a58edaebf2feee43c3f39510606ca5c157b152e77f059a1e89edaf00
|
3 |
+
size 35389440
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83197629a8e1990e5af7b7c479d974b528864b4d06629716cfa70d7f0d9ab871
|
3 |
+
size 35389440
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2bc4433f1a568f720c11a01b996b2d3f1789a6ffc1761d40cfee70db2eb15c9
|
3 |
+
size 35389440
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03db64985b3a66e4496fe44f251f86731c6396b8f56d553d463fe765ec4e2cdd
|
3 |
+
size 32952320
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99e706ee08ee224d1f8e412afbcf5d5c72b91818586be0db21eeee219f6a60e2
|
3 |
+
size 70778880
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7591d77e9072a46689e171edcccde6d2f72d27ea01414dde9884108c6753636
|
3 |
+
size 35389440
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b0c91f088c1e104ec919689958c0aab0876dc39c035427bd8e2b3595bfe44bf
|
3 |
+
size 70778880
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:944071a05df34c39669b7f2cbee05a388a9c5a5860048f297ced94dbac884e88
|
3 |
+
size 32460800
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:326b2f40aec43177ef1be8c1d3ed3625ab949fa46b8f394b4c105f82fba7fcbe
|
3 |
+
size 39321600
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa0dbefedbac6294a1a39cbbac432eb61431cd7bbad2769550a64bcfc9c7eb60
|
3 |
+
size 35389440
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d70c0d863bf242eb5270a708338eda091e8a2b54429bd17de5ab60b0c66d404
|
3 |
+
size 70778880
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51934f974c2ca0f1ac0e37b7711667f9844afa3b2f051175da817e1c03f92dec
|
3 |
+
size 32952320
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abb8b7c8d65323f288e555a8a388822772ca752b7700712439a494bd8c1ef5fb
|
3 |
+
size 70778880
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e82ac620b278d33994c3451a0b3e90c3cabd314cdcad05161e23a81d22dad426
|
3 |
+
size 39321600
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f55bc271c290c22d50822bd1d781dc3980264f7c70dcffab9ce8218f08638aa5
|
3 |
+
size 35389440
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f01aa6cb70355cdf1d2c28ef06835417870d8419836dd71af8fdd3fdb60ceac
|
3 |
+
size 70778880
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae2e45b959538612e2f1307aab4153fee442d95aea84f9da5ad2945ae5083a14
|
3 |
+
size 32952320
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f36f97d5c347a6e78f63537a66e53ba3ee8be73a29d83b367a249c2fce4effd9
|
3 |
+
size 39321600
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a851e49395cd8ecaeb74f070f6cbdab9f0d4d79baef41bd8c173cb6c3d8c59f
|
3 |
+
size 35389440
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ccff38f8cfa4ea18433a81cd45b967eefedd413311a7b840fa5e7263b8246cb
|
3 |
+
size 70778880
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9a93152b0711dad36fd6fb86f4b964c74378aa5f37d8f8835e7881e1600a40
|
3 |
+
size 32952320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f20de57a3177795c6c912427a2b2af1e76ed55c11939da0b4bbc08128756e6
|
3 |
+
size 39321600
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fb70b41a9ec0ba1b0b027fa12eaf0b5c3b51737107e6cc52d5fc8614213c35d
|
3 |
+
size 35389440
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ee261e7d636f0ea8d78ae78cbd50d9db306485de4f252dd088010edf4cefdee
|
3 |
+
size 39321600
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd1c6abfdc0fe23c2ed3bbd1b1e520fad41cf5657385907abcfa376f8ebef4d8
|
3 |
+
size 70778880
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc9d554be49282eebd94e9da1e431ffdae28bf8c588ddb88d5b8507acd5cf128
|
3 |
+
size 32952320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3156db8e8f2c6f59bf9f2f54c1aba45c4aa1b35c402b49e262bf051d5a25b31
|
3 |
+
size 39321600
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cba66c5b1a7a2e4e9d7e1faeebe8c25605e9936fb5a82e752c24c7c951d126f
|
3 |
+
size 35389440
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd5f44474c7d621aab12b8f7010675b436d0ae9c2fee5b6a93ef5bb4bf208fc1
|
3 |
+
size 70778880
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cd636504b03b1d7fffc397b4f70701999a0ddedffe7a6838f84a6f872a7dcca
|
3 |
+
size 32952320
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0271b914662e2946397d31185664a535800cd95daa74cfd2cce2233533e47c7
|
3 |
+
size 39321600
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f34050896ad34b3cde16646a675db0d432b373e49490480a6cc0bfac97db5ad
|
3 |
+
size 35389440
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07255f7d9228ee8b3bf48e1a3edcf79fc748702592bd7398a33a8db85fea92c9
|
3 |
+
size 70778880
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1909bffa38e9ff1f56f2d8666124f454d8213b5736012e51c7a5d122a14c662e
|
3 |
+
size 32952320
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23aa271deb0fc94eff629cb6031ad056b86f8596843f8b2e230eb7e3e217ea34
|
3 |
+
size 32952320
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf0908167766dfaec3254ff6b87fea1384d3f30c8f8d519982863059c4b33881
|
3 |
+
size 39321600
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73407d96f71dad248bfbba32bb35cbd9f0f1edf16d3f6ff8e55efaa4205502a1
|
3 |
+
size 35389440
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bc6af27a66b2f77eb5341e250d0193c43e4644efd4398a3a43c659a0f9f5cb2
|
3 |
+
size 70778880
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1296c21ecb03803d97363148baf705e711d456071e5c15015e8d7a5b06651e9d
|
3 |
+
size 32952320
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c66e26e33903095cf0e81cd897564a3dca1a51ed1d49236bdbe71d30901517fe
|
3 |
+
size 39321600
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2baed07fc9631820d4db0371d4b68828deeb79f629b1b48997ecb83f26063934
|
3 |
+
size 35389440
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dd6141dce2e93ae35d528a1c5c89e5df804e98382265b5e25f938bfdb20bdc8
|
3 |
+
size 70778880
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d882c1e0cd5d99f940aa5c44edde5873195807273f5a70df6d8ec001caa3bcd0
|
3 |
+
size 32952320
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2bf78d487cdf8164300f46ddfb745f930707c9b39e37920c07746e157beef46
|
3 |
+
size 39321600
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a9d5e7d96e3298e23cd9389406a405b6dfe139ea21c09fe635d304791f943c6
|
3 |
+
size 35389440
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ae41431cb168616708ab4c2a3b29f590f97deac5ea7d2e6477dbad0af3a4fd0
|
3 |
+
size 35389440
|