tuanna08go commited on
Commit
45b451e
·
verified ·
1 Parent(s): 3d09ed0

Training in progress, step 18, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a187a7a11dd6a27072e285072042a649c8028a4687fed6282575a943513dd3be
3
  size 36981072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13fe05a92754b8bef955406ff78f460e177504adaf486448c33bc0b8e389d46a
3
  size 36981072
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f990261de2855ce31f884f8bfe37b02e49b2d66175aa902b1f3b638917e25446
3
  size 19859140
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc7de28f21a93c715580535bc1a5f1a2dc06418b3e56b33ffa800892140dc93
3
  size 19859140
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30f7f8c32b023f47232c3c926ef5ae8543f8a77cbf64c31de880f8288599f625
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a14c492499077a4c95e201e5027fa03e78d18afdffa28e19e530c9a797cfacc0
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbd37f4723efc302d162f450f29ed4f7093ff324d3bd36b0e678a3163e9abf68
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10e175ebe60f1a6bbd43d635188097fdd53bf710ff976db3f946328fc19cf4ba
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5549132947976878,
5
  "eval_steps": 5,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -38,6 +38,14 @@
38
  "eval_samples_per_second": 51.607,
39
  "eval_steps_per_second": 6.716,
40
  "step": 10
 
 
 
 
 
 
 
 
41
  }
42
  ],
43
  "logging_steps": 10,
@@ -57,7 +65,7 @@
57
  "attributes": {}
58
  }
59
  },
60
- "total_flos": 6226526563467264.0,
61
  "train_batch_size": 8,
62
  "trial_name": null,
63
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8323699421965318,
5
  "eval_steps": 5,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
38
  "eval_samples_per_second": 51.607,
39
  "eval_steps_per_second": 6.716,
40
  "step": 10
41
+ },
42
+ {
43
+ "epoch": 0.6936416184971098,
44
+ "eval_loss": 7.122732639312744,
45
+ "eval_runtime": 2.9017,
46
+ "eval_samples_per_second": 50.316,
47
+ "eval_steps_per_second": 6.548,
48
+ "step": 15
49
  }
50
  ],
51
  "logging_steps": 10,
 
65
  "attributes": {}
66
  }
67
  },
68
+ "total_flos": 9339789845200896.0,
69
  "train_batch_size": 8,
70
  "trial_name": null,
71
  "trial_params": null