Training in progress, step 12500

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +153 -3
pytorch_model.bin +1 -1
runs/Jan01_04-28-26_6ea5fb75c867/events.out.tfevents.1672547319.6ea5fb75c867.24.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:695ea22c16d59b8f8e7d8bcd0620d0c0f0cb7c3578a0fb43c564437f3ba1279f
 size 1115513717

 version https://git-lfs.github.com/spec/v1
+oid sha256:3fa988a042b2cdca0db941098a7b0889a7f6ef2a60d3c2eecc5665835671501f
 size 1115513717

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73a52c17999eaef626df679c5f03ad9c53b61713db7706f9c3432222c1b6c6a3
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:24bd601333f9b24ae84ddecb08d08fa20af94e90b0ef9fe6d30560e699c3000f
 size 557969145

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e5f8f9f68a550cc99dfdaed2042005f3b6ddc4eafa0827c34c6b5a1e335d304
 size 15523

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f4192ba426584b0e6f477cc4c524f9890045d0a7e9f4c59e75fdc81e08123b7
 size 15523

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d52951fc965683e697127d8227f41545dee9b14abb397312476c1d018a09dfd
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:d2094fcc97958c7c57904b53d4a0a0469e8a2a4a35877adb27094a24fdfc3798
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.149029070435482,
-  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -606,11 +606,161 @@
       "learning_rate": 1.8083748244606157e-05,
       "loss": 2.3654,
       "step": 10000
     }
   ],
   "max_steps": 15666,
   "num_train_epochs": 2,
-  "total_flos": 3.953048407805952e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.4362863380443525,
+  "global_step": 12500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.8083748244606157e-05,
       "loss": 2.3654,
       "step": 10000
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 1.7764585727052216e-05,
+      "loss": 2.3825,
+      "step": 10100
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 1.7445423209498275e-05,
+      "loss": 2.3245,
+      "step": 10200
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 1.712626069194434e-05,
+      "loss": 2.2869,
+      "step": 10300
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 1.68070981743904e-05,
+      "loss": 2.3207,
+      "step": 10400
+    },
+    {
+      "epoch": 1.21,
+      "learning_rate": 1.648793565683646e-05,
+      "loss": 2.3041,
+      "step": 10500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.6168773139282523e-05,
+      "loss": 2.3543,
+      "step": 10600
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.5849610621728586e-05,
+      "loss": 2.3026,
+      "step": 10700
+    },
+    {
+      "epoch": 1.24,
+      "learning_rate": 1.553044810417465e-05,
+      "loss": 2.2919,
+      "step": 10800
+    },
+    {
+      "epoch": 1.25,
+      "learning_rate": 1.5211285586620708e-05,
+      "loss": 2.3805,
+      "step": 10900
+    },
+    {
+      "epoch": 1.26,
+      "learning_rate": 1.4892123069066769e-05,
+      "loss": 2.3523,
+      "step": 11000
+    },
+    {
+      "epoch": 1.28,
+      "learning_rate": 1.4572960551512832e-05,
+      "loss": 2.2931,
+      "step": 11100
+    },
+    {
+      "epoch": 1.29,
+      "learning_rate": 1.4253798033958893e-05,
+      "loss": 2.2623,
+      "step": 11200
+    },
+    {
+      "epoch": 1.3,
+      "learning_rate": 1.3934635516404954e-05,
+      "loss": 2.28,
+      "step": 11300
+    },
+    {
+      "epoch": 1.31,
+      "learning_rate": 1.3615472998851015e-05,
+      "loss": 2.3121,
+      "step": 11400
+    },
+    {
+      "epoch": 1.32,
+      "learning_rate": 1.3296310481297078e-05,
+      "loss": 2.3111,
+      "step": 11500
+    },
+    {
+      "epoch": 1.33,
+      "learning_rate": 1.2977147963743139e-05,
+      "loss": 2.332,
+      "step": 11600
+    },
+    {
+      "epoch": 1.34,
+      "learning_rate": 1.26579854461892e-05,
+      "loss": 2.3495,
+      "step": 11700
+    },
+    {
+      "epoch": 1.36,
+      "learning_rate": 1.233882292863526e-05,
+      "loss": 2.2864,
+      "step": 11800
+    },
+    {
+      "epoch": 1.37,
+      "learning_rate": 1.2019660411081324e-05,
+      "loss": 2.3482,
+      "step": 11900
+    },
+    {
+      "epoch": 1.38,
+      "learning_rate": 1.1700497893527385e-05,
+      "loss": 2.2843,
+      "step": 12000
+    },
+    {
+      "epoch": 1.39,
+      "learning_rate": 1.1381335375973447e-05,
+      "loss": 2.3075,
+      "step": 12100
+    },
+    {
+      "epoch": 1.4,
+      "learning_rate": 1.1062172858419507e-05,
+      "loss": 2.3899,
+      "step": 12200
+    },
+    {
+      "epoch": 1.41,
+      "learning_rate": 1.074301034086557e-05,
+      "loss": 2.3496,
+      "step": 12300
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 1.042384782331163e-05,
+      "loss": 2.3482,
+      "step": 12400
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.0104685305757693e-05,
+      "loss": 2.2579,
+      "step": 12500
     }
   ],
   "max_steps": 15666,
   "num_train_epochs": 2,
+  "total_flos": 4.940417519751168e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73a52c17999eaef626df679c5f03ad9c53b61713db7706f9c3432222c1b6c6a3
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:24bd601333f9b24ae84ddecb08d08fa20af94e90b0ef9fe6d30560e699c3000f
 size 557969145

runs/Jan01_04-28-26_6ea5fb75c867/events.out.tfevents.1672547319.6ea5fb75c867.24.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f511a742a4b5f180697e41094bff1017383d78f0e31e1610835895acb5b91dcc
-size 20535

 version https://git-lfs.github.com/spec/v1
+oid sha256:b418208d85d0b6e99ed4edaaf8699502243c81bf86dcb36a87f1a130a498c62a
+size 24460