at676 committed on
Commit
0eff310
·
1 Parent(s): ecf2e38

Upload folder using huggingface_hub (#1)

Browse files

- 946793be5025b9792ce96bace8ec5c7ddb7860323730e627693ff9fb7e5d0cc9 (210735dc9c2a16373e87d323069209d00ec1e259)
- 28607bdfd91eb825246c1983a4acb9f5a24704e3b23e4c35bc492dc7c7dc89f3 (a6c4a06016757b870a181ab90faf86f1d6753379)
- 39077dbcdb8cc83363e63b482e1f2ffb14b5ac8e3823882e038accb2452a0e89 (a878dde64a350febd26b486aafc05d465c28fae7)
- 4cf319c8c2365b4603a774958c3002186900b1605006b92d1afde68d51ba5f67 (255af5ae35c1da028a3ab46563802935dba686e3)
- 2023d1399f80755098819eb6773e903eb79846573481cb4b9a7df16d172741d0 (a9c90c7e2df6b318a6b8140ee44465bda1532741)

config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "relaxml/Llama-1-65b-hf",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 8192,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 22016,
13
+ "max_position_embeddings": 2048,
14
+ "model_type": "llama",
15
+ "num_attention_heads": 64,
16
+ "num_hidden_layers": 80,
17
+ "num_key_value_heads": 64,
18
+ "pretraining_tp": 1,
19
+ "quip_params": {
20
+ "codebook": "E8P12RVQ4B",
21
+ "codebook_version": 1,
22
+ "codesz": 8,
23
+ "fused": true,
24
+ "idx_dtype": "torch.int64",
25
+ "lora_rank": 0,
26
+ "model_version": 1,
27
+ "outlier_channel_split": false,
28
+ "packsz": 2,
29
+ "rescale_WH": false,
30
+ "resid_scale_override": 3.45
31
+ },
32
+ "rms_norm_eps": 1e-05,
33
+ "rope_scaling": null,
34
+ "rope_theta": 10000.0,
35
+ "tie_word_embeddings": false,
36
+ "torch_dtype": "float16",
37
+ "transformers_version": "4.34.0",
38
+ "use_cache": true,
39
+ "vocab_size": 32000
40
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.34.0"
6
+ }
model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d17d0418031aa49c26205d49e118d07cc0358d9340d370abc4f1b0da93560e3
3
+ size 9974731824
model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e062d1fd2349e8b5caecc7e2f0d14e8bcecf262069db2fc22a3e81d0e42b23ef
3
+ size 9991907352
model-00003-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d585b1fcd2399bd89e24e6fdd63b408cc8e520c4feedf4944d696b7b8504b7ce
3
+ size 9855492946
model-00004-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc9f1b5886da1f6130cf8b0427dc00d6f7c1b7e85d8f3551e82ea9dca66bd23d
3
+ size 3630379158
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff