AnkurGupta1 committed on
Commit
f44da9f
·
verified ·
1 Parent(s): af1c596

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [microsoft/Phi-3-mini-128k-instruct](https://huggingface.co/microsoft/Phi-3-mini-128k-instruct) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 2.1499
22
 
23
  ## Model description
24
 
@@ -53,11 +53,11 @@ The following hyperparameters were used during training:
53
 
54
  | Training Loss | Epoch | Step | Validation Loss |
55
  |:-------------:|:-----:|:----:|:---------------:|
56
- | 2.0996 | 0.4 | 2 | 2.2203 |
57
- | 2.1578 | 0.8 | 4 | 2.1806 |
58
- | 1.9713 | 1.2 | 6 | 2.1613 |
59
- | 2.067 | 1.6 | 8 | 2.1525 |
60
- | 1.8717 | 2.0 | 10 | 2.1499 |
61
 
62
 
63
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [microsoft/Phi-3-mini-128k-instruct](https://huggingface.co/microsoft/Phi-3-mini-128k-instruct) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 2.5556
22
 
23
  ## Model description
24
 
 
53
 
54
  | Training Loss | Epoch | Step | Validation Loss |
55
  |:-------------:|:-----:|:----:|:---------------:|
56
+ | 2.4798 | 0.4 | 2 | 2.6784 |
57
+ | 2.5949 | 0.8 | 4 | 2.6066 |
58
+ | 2.3319 | 1.2 | 6 | 2.5751 |
59
+ | 2.5069 | 1.6 | 8 | 2.5597 |
60
+ | 2.2803 | 2.0 | 10 | 2.5556 |
61
 
62
 
63
  ### Framework versions
adapter_config.json CHANGED
@@ -22,8 +22,8 @@
22
  "target_modules": [
23
  "v_proj",
24
  "q_proj",
25
- "o_proj",
26
- "k_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
 
22
  "target_modules": [
23
  "v_proj",
24
  "q_proj",
25
+ "k_proj",
26
+ "o_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:899d386e4d3e5c7392b2b6e38e49b2e01b932405f9bcaaa565cfa653c07322ec
3
  size 12591456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:192c22047f638b7bd795006bcb9052d96a113e2118b11dcb925514d672a00438
3
  size 12591456
runs/Jun01_10-27-47_2303b76e0112/events.out.tfevents.1717237668.2303b76e0112.20343.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:228a9c6ecf5c84881390e2a46c812380b7b3eb4889ea7adc881ddfab93851a16
3
+ size 11881
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 128,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08ab11c6985f9b623509d624b9dceb862ebec5d2c2b4d2782dfd3ddf62255fdc
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fa946ac499622d1737b53c65feedf16d367bf2ffeb4dcffff1f8a38fb2683e5
3
  size 5112