Upload 15 files

Files changed (15) hide show

config.json ADDED Viewed

+{
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 12288,
+  "initializer_range": 0.02,
+  "intermediate_size": 28672,
+  "max_position_embeddings": 32768,
+  "model_type": "mistral",
+  "num_attention_heads": 96,
+  "num_hidden_layers": 88,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.42.3",
+  "use_cache": true,
+  "vocab_size": 32768
+}

generation_config.json ADDED Viewed

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.42.3"
+}

output-00001-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:555e2cfc9a1b4fb29cf92d1e651f05477b6c3c7770f4a4f586fbcbff967c3c29
+size 8578360014

output-00002-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3d0e766d1165a4f18b24fa192b25928622899e5794e70381b1a9f37e778ef8b7
+size 8454161966

output-00003-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5d2ed1fd5995593746bdc62594d2b227c2dbd82c0363488e05baee3e9696797
+size 8482966348

output-00004-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a22231800254be6b17f6d63f4887b49477e7375ea32e901f8ce0dca720146fb9
+size 8437961732

output-00005-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3015907b5905e56241a2867b5afe06a5203af4309475b1024af04a00feb8fd0f
+size 8586745704

output-00006-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e989c55fb4b2199d829df25dbe203b2863c4a2377d5678a0d6a5aadb0a6dfeef
+size 8550993000

output-00007-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a567fe629ac087fce04b81c868d580ccfd013aee679128bd7beed69aceecb7d3
+size 8429247308

output-00008-of-00008.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:40cd4b935e2a919fe3f379b0bbf16fc4edf27f3fa736ad1bb76098bd279a4e77
+size 2504344804

params.json ADDED Viewed

+{
+    "dim": 12288,
+    "n_layers": 88,
+    "head_dim": 128,
+    "hidden_dim": 28672,
+    "n_heads": 96,
+    "n_kv_heads": 8,
+    "norm_eps": 1e-05,
+    "vocab_size": 32768,
+    "rope_theta": 1000000.0
+}

test.py ADDED Viewed

+import json
+from typing import Dict
+from safetensors.torch import load_file, save_file
+from huggingface_hub import split_torch_state_dict_into_shards
+import torch
+import os
+def save_state_dict(state_dict: Dict[str, torch.Tensor], save_directory: str):
+    state_dict_split = split_torch_state_dict_into_shards(state_dict, filename_pattern='consolidated{suffix}.safetensors')
+    for filename, tensors in state_dict_split.filename_to_tensors.items():
+        shard = {tensor: state_dict[tensor] for tensor in tensors}
+        print("Saving", save_directory, filename)
+        save_file(shard, os.path.join(save_directory, filename))
+    if state_dict_split.is_sharded:
+        index = {
+            "metadata": state_dict_split.metadata,
+            "weight_map": state_dict_split.tensor_to_filename,
+        }
+        with open(os.path.join(save_directory, "consolidated.safetensors.index.json"), "w") as f:
+            f.write(json.dumps(index, indent=2))
+big_file = 'consolidated.safetensors'
+loaded = load_file(big_file)
+save_state_dict(loaded, save_directory=f'.')

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model.v3 ADDED Viewed

Binary file (588 kB). View file

tokenizer_config.json ADDED Viewed

The diff for this file is too large to render. See raw diff