Training in progress, step 3980, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:65fb83a9c29de4d7e06afb8b3d4a0bc435a164c5edf7e6c2fa23710ae1a60ce7
 size 281587880

 version https://git-lfs.github.com/spec/v1
+oid sha256:7057efa04f84d06fb8967e215cd3ed4e982d7324a9964d6bbddac5f0e932d7f5
 size 281587880

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4823923d11463c6c19d97e755766c27ce38303eafe89ab5ada265bab0bbe5b90
 size 143366164

 version https://git-lfs.github.com/spec/v1
+oid sha256:9e1eb62a18526c2a140b51e8df453f354efe9fff401a06b4a4b58ee9618117dd
 size 143366164

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f2c5c72e32ad22e8d120f7d7edf6daaf711756d9fa00a36d422ea40f0caa191
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:fc3697b212f20146262137e7c1a969576663ccc4ae69304edc36288b1d18cfd1
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5a4dc5a674fde8d2c06fe93bf7b2c8667a033dd0cbccf2a677c1b9887cba0ce7
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:5b9e6d31c8b9ec88e33f75ea2e1485990411f6bd2ad3eadb72c07fb2ff77cc4a
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6997093fbcc5f6569002def419d62b598060366c7db5d40180535218354720a5
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:3d078af19d6439842c947502bac22108599fc2ee9fcd36b51d3f5f8765f9e42c
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:283b6a005aa2ecb118df9e93de7151dbb618e242f2d6010fe353df775799e7ec
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:5982284510275852c78aa2d02bd147d4856df83b4bf467c5c077c2680e8271c0
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f76715176eec92c229f6a6975d3c1c21d42bfd2d495770679a8163b6cacae4f
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0a4ea943eff6a00a0d44284eab894bea8fb50f7f4cf9fce50a355f53053d12e
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:49d72a006b11c9543e4141388b8b2e62469fa2ee739d4203b7b31cbc2cbcf83c
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:ae334b3ce7770bc0260e90dc8782002eb4f829e4a83cf87989a3bcab2ddad5aa
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8be4774a72fd8902031956bbdc9def78b6c03abe70c3345a6e2e97d7a94e0a46
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:cec5f6de25d29de2f1bb3c4f3529450759465854bf2202d64d33659c58ee0a0e
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e2357a748cc633ba04296ecae8c5fe4fa41bfcea06d4a3d0adec5d176c84c343
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd393c8d7b7d37049aa33eaacfe9ea78417f491646acb1001289f2f04bc216ff
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:29ed43ed763944b1379237a172f715de83b2736df81605a2b7bca80685584747
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e374cd16ce446630eb5de7b6aef11f861ca1227fccdd18be31c30ca89d07e197
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 99.0,
   "eval_steps": 40,
-  "global_step": 3960,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3579,6 +3579,20 @@
       "eval_samples_per_second": 110.154,
       "eval_steps_per_second": 15.299,
       "step": 3960
     }
   ],
   "logging_steps": 10,
@@ -3598,7 +3612,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.6672394960909107e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 99.5,
   "eval_steps": 40,
+  "global_step": 3980,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 110.154,
       "eval_steps_per_second": 15.299,
       "step": 3960
+    },
+    {
+      "epoch": 99.25,
+      "grad_norm": 1.4808772903052159e-05,
+      "learning_rate": 2.8093068117240885e-08,
+      "loss": 0.0,
+      "step": 3970
+    },
+    {
+      "epoch": 99.5,
+      "grad_norm": 1.7599566490389407e-05,
+      "learning_rate": 1.2486132855826781e-08,
+      "loss": 0.0,
+      "step": 3980
     }
   ],
   "logging_steps": 10,
       "attributes": {}
     }
   },
+  "total_flos": 1.6756598975863194e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null