awsuineg committed on
Commit
a008dc7
·
verified ·
1 Parent(s): 94462c6

Model save

Browse files
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "down_proj",
24
- "k_proj",
25
- "v_proj",
26
- "up_proj",
27
  "o_proj",
 
28
  "gate_proj",
29
- "q_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
 
23
  "o_proj",
24
+ "q_proj",
25
  "gate_proj",
26
+ "v_proj",
27
+ "down_proj",
28
+ "k_proj",
29
+ "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
all_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 1.1487027058043781e+19,
4
- "train_loss": 0.8902242264134556,
5
- "train_runtime": 34738.9702,
6
  "train_samples": 207864,
7
- "train_samples_per_second": 3.992,
8
- "train_steps_per_second": 0.166
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 1.1487027058043781e+19,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 0.0169,
6
  "train_samples": 207864,
7
+ "train_samples_per_second": 8184133.024,
8
+ "train_steps_per_second": 341027.672
9
  }
runs/Nov18_09-06-30_d28f7adca72c/events.out.tfevents.1731920841.d28f7adca72c.1609162.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8319038ea07c5da8c1ca7771696a58956a792eef296dcd151f6d4fed81baafa
3
+ size 6998
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 1.1487027058043781e+19,
4
- "train_loss": 0.8902242264134556,
5
- "train_runtime": 34738.9702,
6
  "train_samples": 207864,
7
- "train_samples_per_second": 3.992,
8
- "train_steps_per_second": 0.166
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 1.1487027058043781e+19,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 0.0169,
6
  "train_samples": 207864,
7
+ "train_samples_per_second": 8184133.024,
8
+ "train_steps_per_second": 341027.672
9
  }
trainer_state.json CHANGED
@@ -8100,22 +8100,14 @@
8100
  "loss": 0.8886,
8101
  "step": 5775
8102
  },
8103
- {
8104
- "epoch": 1.0,
8105
- "eval_loss": 0.9683669805526733,
8106
- "eval_runtime": 1122.8206,
8107
- "eval_samples_per_second": 13.671,
8108
- "eval_steps_per_second": 0.57,
8109
- "step": 5779
8110
- },
8111
  {
8112
  "epoch": 1.0,
8113
  "step": 5779,
8114
  "total_flos": 1.1487027058043781e+19,
8115
- "train_loss": 0.8902242264134556,
8116
- "train_runtime": 34738.9702,
8117
- "train_samples_per_second": 3.992,
8118
- "train_steps_per_second": 0.166
8119
  }
8120
  ],
8121
  "logging_steps": 5,
 
8100
  "loss": 0.8886,
8101
  "step": 5775
8102
  },
 
 
 
 
 
 
 
 
8103
  {
8104
  "epoch": 1.0,
8105
  "step": 5779,
8106
  "total_flos": 1.1487027058043781e+19,
8107
+ "train_loss": 0.0,
8108
+ "train_runtime": 0.0169,
8109
+ "train_samples_per_second": 8184133.024,
8110
+ "train_steps_per_second": 341027.672
8111
  }
8112
  ],
8113
  "logging_steps": 5,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f37293628d10e47961ded5c449d8942fe36a719860387f0553788b63228638f
3
  size 6328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82763ac4d1451da25c7cb359dd9ee2581f99c3d2b8db998d96375db407c0978e
3
  size 6328