Training in progress, step 39, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b0a97ccfa72c39621a5fbbc20bb25f98ee1e332fbd96861281255b0240bf39e
 size 36981072

 version https://git-lfs.github.com/spec/v1
+oid sha256:122a7b3af0e0a60bac97552ab32f84563eb31164e9a1bb9120d1b19176ef0f10
 size 36981072

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:507d25898c9bef0156384c4e8f389d97f3251b9939d927303b2cb00579667edf
 size 19859140

 version https://git-lfs.github.com/spec/v1
+oid sha256:deb5320aeabcdaaab9038235f6dd9e4e261b4f7be12e01909661e93b1f3bc460
 size 19859140

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:90d14217b9aab4afc34bce8881096a848de30c1e82c9da12bc5a58ed5b303046
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee0d25207b91073ecb1d8a246fff2f3dfd714db66536f34092c31ccf8ef9581c
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:37841e69eda911caeb33edeefa0b2f140e72dcce247aeb757b2fe89c00d7887b
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c50dbaa792cda4a28fbbc2acb2a3e03c59530712bbc5107212d33064d193da4
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.021711899791231733,
   "eval_steps": 10,
-  "global_step": 26,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -66,6 +66,28 @@
       "learning_rate": 6.91341716182545e-05,
       "loss": 0.4975,
       "step": 25
     }
   ],
   "logging_steps": 5,
@@ -85,7 +107,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 859390385061888.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.0325678496868476,
   "eval_steps": 10,
+  "global_step": 39,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.91341716182545e-05,
       "loss": 0.4975,
       "step": 25
+    },
+    {
+      "epoch": 0.025052192066805846,
+      "grad_norm": 0.8014892935752869,
+      "learning_rate": 5e-05,
+      "loss": 0.4266,
+      "step": 30
+    },
+    {
+      "epoch": 0.025052192066805846,
+      "eval_loss": 0.43505820631980896,
+      "eval_runtime": 23.9252,
+      "eval_samples_per_second": 21.107,
+      "eval_steps_per_second": 10.575,
+      "step": 30
+    },
+    {
+      "epoch": 0.029227557411273485,
+      "grad_norm": 0.7463769912719727,
+      "learning_rate": 3.086582838174551e-05,
+      "loss": 0.405,
+      "step": 35
     }
   ],
   "logging_steps": 5,
       "attributes": {}
     }
   },
+  "total_flos": 1305300490518528.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null