Training in progress, step 15000

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +153 -3
pytorch_model.bin +1 -1
runs/Jan26_03-13-45_b3489f7155a5/events.out.tfevents.1674703022.b3489f7155a5.24.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fcf16c77fc4c696d5ecec66bb94ab1a72596ecc42da185a1509a0a37aa93d820
 size 1115513717

 version https://git-lfs.github.com/spec/v1
+oid sha256:38bbc7cd108d4066f57dece94d18666a0619186fb83ead8f178ba5374f85c4d4
 size 1115513717

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:001276adc811be2b4e3383d1bfd82644ee01b63c562240704981e80abf57ea78
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b3390a170051de185cec86c8c4131be12aeb79afd4f2697385bcd3c5fe72132
 size 557969145

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ea4cb9a85921bdde5a8523300b183bff3f70a1aeb0368e6a4c669b696d1922c
 size 15523

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d8425ca758719b66e03746ec5ac1a9a95c444f7ea14cfc4567c5f50fa51c740
 size 15523

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af29429f2a56160c0a3cb3b03c7b28cc9e5f472234bebefa86da284747a0d6d1
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:03778c2e3b15a96003ceff9d06ee5b9ecdadc81dcfa36477cad7912647bf1ff9
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.4356265074078327,
-  "global_step": 12500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -756,11 +756,161 @@
       "learning_rate": 1.0122503668729662e-05,
       "loss": 0.6705,
       "step": 12500
     }
   ],
   "max_steps": 15673,
   "num_train_epochs": 2,
-  "total_flos": 4.939903709604864e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.7227518088893994,
+  "global_step": 15000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.0122503668729662e-05,
       "loss": 0.6705,
       "step": 12500
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 9.8034836980795e-06,
+      "loss": 0.5761,
+      "step": 12600
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 9.484463727429338e-06,
+      "loss": 0.5709,
+      "step": 12700
+    },
+    {
+      "epoch": 1.47,
+      "learning_rate": 9.165443756779176e-06,
+      "loss": 0.562,
+      "step": 12800
+    },
+    {
+      "epoch": 1.48,
+      "learning_rate": 8.846423786129014e-06,
+      "loss": 0.6113,
+      "step": 12900
+    },
+    {
+      "epoch": 1.49,
+      "learning_rate": 8.52740381547885e-06,
+      "loss": 0.6137,
+      "step": 13000
+    },
+    {
+      "epoch": 1.5,
+      "learning_rate": 8.208383844828686e-06,
+      "loss": 0.5669,
+      "step": 13100
+    },
+    {
+      "epoch": 1.52,
+      "learning_rate": 7.889363874178523e-06,
+      "loss": 0.6175,
+      "step": 13200
+    },
+    {
+      "epoch": 1.53,
+      "learning_rate": 7.570343903528361e-06,
+      "loss": 0.6069,
+      "step": 13300
+    },
+    {
+      "epoch": 1.54,
+      "learning_rate": 7.251323932878198e-06,
+      "loss": 0.5949,
+      "step": 13400
+    },
+    {
+      "epoch": 1.55,
+      "learning_rate": 6.932303962228036e-06,
+      "loss": 0.6207,
+      "step": 13500
+    },
+    {
+      "epoch": 1.56,
+      "learning_rate": 6.613283991577873e-06,
+      "loss": 0.596,
+      "step": 13600
+    },
+    {
+      "epoch": 1.57,
+      "learning_rate": 6.294264020927711e-06,
+      "loss": 0.5972,
+      "step": 13700
+    },
+    {
+      "epoch": 1.58,
+      "learning_rate": 5.975244050277548e-06,
+      "loss": 0.6127,
+      "step": 13800
+    },
+    {
+      "epoch": 1.6,
+      "learning_rate": 5.6562240796273845e-06,
+      "loss": 0.6214,
+      "step": 13900
+    },
+    {
+      "epoch": 1.61,
+      "learning_rate": 5.337204108977222e-06,
+      "loss": 0.6009,
+      "step": 14000
+    },
+    {
+      "epoch": 1.62,
+      "learning_rate": 5.018184138327059e-06,
+      "loss": 0.628,
+      "step": 14100
+    },
+    {
+      "epoch": 1.63,
+      "learning_rate": 4.699164167676897e-06,
+      "loss": 0.6096,
+      "step": 14200
+    },
+    {
+      "epoch": 1.64,
+      "learning_rate": 4.380144197026735e-06,
+      "loss": 0.5396,
+      "step": 14300
+    },
+    {
+      "epoch": 1.65,
+      "learning_rate": 4.061124226376571e-06,
+      "loss": 0.554,
+      "step": 14400
+    },
+    {
+      "epoch": 1.67,
+      "learning_rate": 3.7421042557264087e-06,
+      "loss": 0.5867,
+      "step": 14500
+    },
+    {
+      "epoch": 1.68,
+      "learning_rate": 3.423084285076246e-06,
+      "loss": 0.584,
+      "step": 14600
+    },
+    {
+      "epoch": 1.69,
+      "learning_rate": 3.1040643144260834e-06,
+      "loss": 0.587,
+      "step": 14700
+    },
+    {
+      "epoch": 1.7,
+      "learning_rate": 2.7850443437759203e-06,
+      "loss": 0.605,
+      "step": 14800
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 2.4660243731257577e-06,
+      "loss": 0.5905,
+      "step": 14900
+    },
+    {
+      "epoch": 1.72,
+      "learning_rate": 2.147004402475595e-06,
+      "loss": 0.6208,
+      "step": 15000
     }
   ],
   "max_steps": 15673,
   "num_train_epochs": 2,
+  "total_flos": 5.929193491393536e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:001276adc811be2b4e3383d1bfd82644ee01b63c562240704981e80abf57ea78
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b3390a170051de185cec86c8c4131be12aeb79afd4f2697385bcd3c5fe72132
 size 557969145

runs/Jan26_03-13-45_b3489f7155a5/events.out.tfevents.1674703022.b3489f7155a5.24.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f77dd77e2e1de62f98d722747a220a5ac16ebff7589985b9d63fb7e5c44b6c35
-size 24460

 version https://git-lfs.github.com/spec/v1
+oid sha256:42156792ecc5fb337e2c5b5d1ed6fdc0fe4bf653273b9d8e8c643e6dabea8931
+size 28385