Training in progress, step 10000

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +153 -3
pytorch_model.bin +1 -1
runs/Jan26_03-13-45_b3489f7155a5/events.out.tfevents.1674703022.b3489f7155a5.24.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8246a7bdffa31a2780601cff44a208fa66a42423f08dc44f96fc441f90dcd063
 size 1115513717

 version https://git-lfs.github.com/spec/v1
+oid sha256:0270219bbf3b9d435456104809f3c23a41c4cd1fe51a03b95efb36b90021a044
 size 1115513717

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0f6ee17edbe5be6c0db0fc26e011e3cfca90c6d942052701e91b647fb79172d
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b3509860f8b9090ce37e24daf382d92def3c20605929d105fc7709bfdf4fa92
 size 557969145

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c55dab6106e884ae561d5ed424b58463798e65d5293313f2bcf0598e4e0cd039
 size 15523

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bd78237a8bff2399c24e5136a001794a3e1c14fbfcbde9fa5704a4fcf3d3828
 size 15523

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:007eb7be8567224005d4825ac66cab713ae55402dc507574403696925ab53db1
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc6cc4eff0bedca1e1ffd7c8824dc4da7fe034832dbf96d075af2be5a88f8f30
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8613759044446997,
-  "global_step": 7500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -456,11 +456,161 @@
       "learning_rate": 2.60735022012378e-05,
       "loss": 0.6286,
       "step": 7500
     }
   ],
   "max_steps": 15673,
   "num_train_epochs": 2,
-  "total_flos": 2.969453707444224e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.1485012059262663,
+  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.60735022012378e-05,
       "loss": 0.6286,
       "step": 7500
+    },
+    {
+      "epoch": 0.87,
+      "learning_rate": 2.5754482230587633e-05,
+      "loss": 0.6284,
+      "step": 7600
+    },
+    {
+      "epoch": 0.88,
+      "learning_rate": 2.5435462259937474e-05,
+      "loss": 0.6169,
+      "step": 7700
+    },
+    {
+      "epoch": 0.9,
+      "learning_rate": 2.5116442289287312e-05,
+      "loss": 0.6334,
+      "step": 7800
+    },
+    {
+      "epoch": 0.91,
+      "learning_rate": 2.4797422318637146e-05,
+      "loss": 0.6573,
+      "step": 7900
+    },
+    {
+      "epoch": 0.92,
+      "learning_rate": 2.4478402347986984e-05,
+      "loss": 0.6026,
+      "step": 8000
+    },
+    {
+      "epoch": 0.93,
+      "learning_rate": 2.4159382377336822e-05,
+      "loss": 0.6836,
+      "step": 8100
+    },
+    {
+      "epoch": 0.94,
+      "learning_rate": 2.384036240668666e-05,
+      "loss": 0.6093,
+      "step": 8200
+    },
+    {
+      "epoch": 0.95,
+      "learning_rate": 2.3521342436036498e-05,
+      "loss": 0.6603,
+      "step": 8300
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 2.3202322465386332e-05,
+      "loss": 0.6312,
+      "step": 8400
+    },
+    {
+      "epoch": 0.98,
+      "learning_rate": 2.2883302494736173e-05,
+      "loss": 0.6312,
+      "step": 8500
+    },
+    {
+      "epoch": 0.99,
+      "learning_rate": 2.2564282524086008e-05,
+      "loss": 0.6278,
+      "step": 8600
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 2.224526255343585e-05,
+      "loss": 0.6115,
+      "step": 8700
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 2.1926242582785683e-05,
+      "loss": 0.6666,
+      "step": 8800
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 2.160722261213552e-05,
+      "loss": 0.6047,
+      "step": 8900
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 2.128820264148536e-05,
+      "loss": 0.6174,
+      "step": 9000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 2.0969182670835193e-05,
+      "loss": 0.5977,
+      "step": 9100
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 2.0650162700185034e-05,
+      "loss": 0.553,
+      "step": 9200
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 2.033114272953487e-05,
+      "loss": 0.6447,
+      "step": 9300
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 2.0012122758884706e-05,
+      "loss": 0.5979,
+      "step": 9400
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 1.9693102788234544e-05,
+      "loss": 0.6234,
+      "step": 9500
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 1.9374082817584382e-05,
+      "loss": 0.5939,
+      "step": 9600
+    },
+    {
+      "epoch": 1.11,
+      "learning_rate": 1.905506284693422e-05,
+      "loss": 0.6481,
+      "step": 9700
+    },
+    {
+      "epoch": 1.13,
+      "learning_rate": 1.8736042876284058e-05,
+      "loss": 0.592,
+      "step": 9800
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 1.8417022905633892e-05,
+      "loss": 0.6491,
+      "step": 9900
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 1.8098002934983733e-05,
+      "loss": 0.5978,
+      "step": 10000
     }
   ],
   "max_steps": 15673,
   "num_train_epochs": 2,
+  "total_flos": 3.954111338032128e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0f6ee17edbe5be6c0db0fc26e011e3cfca90c6d942052701e91b647fb79172d
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b3509860f8b9090ce37e24daf382d92def3c20605929d105fc7709bfdf4fa92
 size 557969145

runs/Jan26_03-13-45_b3489f7155a5/events.out.tfevents.1674703022.b3489f7155a5.24.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1e19a8b9d0aee47e4149819f08638c1d2effc4c31ead54c6fa4747637024e00
-size 16610

 version https://git-lfs.github.com/spec/v1
+oid sha256:e582d90f7535fdd56e7dc87ed69608bed0f439782a1664c33152ca1b8568bf2f
+size 20535