Shamane committed on
Commit
97dadb5
·
verified ·
1 Parent(s): cedb246

Upload MistralForCausalLM

Browse files
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "mistralai/Mistral-7B-v0.1",
3
+ "architectures": [
4
+ "MistralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_theta": 10000.0,
21
+ "sliding_window": 4096,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.44.2",
25
+ "use_cache": true,
26
+ "vocab_size": 32000
27
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.44.2"
6
+ }
model-00001-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e0874a5b5bc66986f41f713fad5b2cda2839b0a4daee68f9c1da6f645fdbbc
3
+ size 4992325120
model-00002-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c251c7e52fa81dfd99ba91f7425eca926f3058c5ddd27c450ed969a181d731b
3
+ size 4984151552
model-00003-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f756dc759334f17924a5dfcf78534d3a4d962d483a042b9d303aa171fbdf9d5d
3
+ size 4916809056
model-00004-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99095eb3bd34300b7fdb5a0212b64d7d63c2224f0ae4e7f646e61d4347edb36d
3
+ size 4883521784
model-00005-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a9544a37b428881e6c682f57d3edb52a958d593b707f95652d08fdfd8bcf98f
3
+ size 4883406784
model-00006-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ae8402ffecd2769576b4ff9ab8b259be9c123795ddf3222306edfafb2f0b58
3
+ size 4883488680
model-00007-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bb1ed2527f992f334d8afb00eb2cc05602bafa96223d7a205c4ed041db095f4
3
+ size 4967374784
model-00008-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f1592df82f18c771df91520c04d2a42abd511dd6303ac65be4b63afc2fc2f4c
3
+ size 4967306968
model-00009-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ebf7ddd65777363662ebfd4d38301e7ce8691b5d91a2d52b6c0589f47d5eab
3
+ size 4967241776
model-00010-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2c4452203e6e042f4c82d2f1813152c23116ce49f4ed9c50c392625016c092c
3
+ size 4883406776
model-00011-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75f227ce85aea17f298e944efd58dd1df539d98fc5f8945e961df1ad27f07ba8
3
+ size 4883521896
model-00012-of-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58ab3641aaf7035d46096063460cbe1501a3d9c1e7c052f74f8197ac5e022f42
3
+ size 3733730272
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff