lukeleeai committed on
Commit
b7a49aa
·
verified ·
1 Parent(s): de9dd17

End of training

Browse files
Files changed (3) hide show
  1. README.md +3 -3
  2. config.json +3 -3
  3. model.safetensors +1 -1
README.md CHANGED
@@ -2,18 +2,18 @@
2
  tags:
3
  - generated_from_trainer
4
  model-index:
5
- - name: sparse_llama_debugging_refined_web_90p_debugging_2024-03-21
6
  results: []
7
  ---
8
 
9
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
  should probably proofread and complete it, then remove this comment. -->
11
 
12
- # sparse_llama_debugging_refined_web_90p_debugging_2024-03-21
13
 
14
  This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 10.3835
17
 
18
  ## Model description
19
 
 
2
  tags:
3
  - generated_from_trainer
4
  model-index:
5
+ - name: sparse_llama_7b_refined_web_90p_debugging_2024-03-21
6
  results: []
7
  ---
8
 
9
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
  should probably proofread and complete it, then remove this comment. -->
11
 
12
+ # sparse_llama_7b_refined_web_90p_debugging_2024-03-21
13
 
14
  This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 10.3854
17
 
18
  ## Model description
19
 
config.json CHANGED
@@ -24,10 +24,10 @@
24
  "rope_scaling": null,
25
  "rope_theta": 10000.0,
26
  "thresholds": [
 
27
  0.12938815355300903,
28
- 0.12938815355300903,
29
- 0.1313941776752472,
30
- 0.12337010353803635
31
  ],
32
  "tie_word_embeddings": false,
33
  "torch_dtype": "float32",
 
24
  "rope_scaling": null,
25
  "rope_theta": 10000.0,
26
  "thresholds": [
27
+ 0.1253761202096939,
28
  0.12938815355300903,
29
+ 0.12738214433193207,
30
+ 0.12938815355300903
 
31
  ],
32
  "tie_word_embeddings": false,
33
  "torch_dtype": "float32",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6d65535cc9b9fb7093e5694f896267ee8cf27784649db01dddd983548751290
3
  size 16849208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b9b881a4f5b50ab5ac0dddd75304c1cde45fbb24c33d519c37ae29f5430eaca
3
  size 16849208