sedrickkeh
committed on
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ebd31bd5f7e516dc101d45d664fd4990c434272129c5880c53ade2705b0dc0
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8631719aee68f22ae179b0eff86ef848918d1bac56f6e6e7cc6f0f3f75c5ad12
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab3c87e5399be82d2d32e12b6b5fa550fcf95a8dba6be60f25a43f717af0a583
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57d2e9f288724923b965f7185c9cd69b90e3f7b1ccd679b8bbad64f58d85604b
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -88,3 +88,46 @@
|
|
88 |
{"current_steps": 870, "total_steps": 1314, "loss": 0.5987, "learning_rate": 1.7650226633779838e-06, "epoch": 1.9834757834757835, "percentage": 66.21, "elapsed_time": "12:50:20", "remaining_time": "6:33:08"}
|
89 |
{"current_steps": 877, "total_steps": 1314, "eval_loss": 0.6201021671295166, "epoch": 1.9994301994301993, "percentage": 66.74, "elapsed_time": "13:03:48", "remaining_time": "6:30:33"}
|
90 |
{"current_steps": 880, "total_steps": 1314, "loss": 0.6215, "learning_rate": 1.7144163926130621e-06, "epoch": 2.006837606837607, "percentage": 66.97, "elapsed_time": "13:07:32", "remaining_time": "6:28:23"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
88 |
{"current_steps": 870, "total_steps": 1314, "loss": 0.5987, "learning_rate": 1.7650226633779838e-06, "epoch": 1.9834757834757835, "percentage": 66.21, "elapsed_time": "12:50:20", "remaining_time": "6:33:08"}
|
89 |
{"current_steps": 877, "total_steps": 1314, "eval_loss": 0.6201021671295166, "epoch": 1.9994301994301993, "percentage": 66.74, "elapsed_time": "13:03:48", "remaining_time": "6:30:33"}
|
90 |
{"current_steps": 880, "total_steps": 1314, "loss": 0.6215, "learning_rate": 1.7144163926130621e-06, "epoch": 2.006837606837607, "percentage": 66.97, "elapsed_time": "13:07:32", "remaining_time": "6:28:23"}
|
91 |
+
{"current_steps": 890, "total_steps": 1314, "loss": 0.5677, "learning_rate": 1.6644663166838153e-06, "epoch": 2.0296296296296297, "percentage": 67.73, "elapsed_time": "13:16:18", "remaining_time": "6:19:21"}
|
92 |
+
{"current_steps": 900, "total_steps": 1314, "loss": 0.5834, "learning_rate": 1.6152040863247986e-06, "epoch": 2.0524216524216525, "percentage": 68.49, "elapsed_time": "13:25:04", "remaining_time": "6:10:19"}
|
93 |
+
{"current_steps": 910, "total_steps": 1314, "loss": 0.5813, "learning_rate": 1.5666609164190258e-06, "epoch": 2.0752136752136754, "percentage": 69.25, "elapsed_time": "13:33:50", "remaining_time": "6:01:18"}
|
94 |
+
{"current_steps": 920, "total_steps": 1314, "loss": 0.5844, "learning_rate": 1.5188675662187419e-06, "epoch": 2.098005698005698, "percentage": 70.02, "elapsed_time": "13:42:35", "remaining_time": "5:52:17"}
|
95 |
+
{"current_steps": 930, "total_steps": 1314, "loss": 0.582, "learning_rate": 1.4718543198548998e-06, "epoch": 2.1207977207977207, "percentage": 70.78, "elapsed_time": "13:51:22", "remaining_time": "5:43:16"}
|
96 |
+
{"current_steps": 940, "total_steps": 1314, "loss": 0.5767, "learning_rate": 1.425650967147707e-06, "epoch": 2.1435897435897435, "percentage": 71.54, "elapsed_time": "14:00:07", "remaining_time": "5:34:15"}
|
97 |
+
{"current_steps": 950, "total_steps": 1314, "loss": 0.5776, "learning_rate": 1.3802867847303786e-06, "epoch": 2.1663817663817664, "percentage": 72.3, "elapsed_time": "14:08:52", "remaining_time": "5:25:15"}
|
98 |
+
{"current_steps": 960, "total_steps": 1314, "loss": 0.5825, "learning_rate": 1.3357905174980784e-06, "epoch": 2.1891737891737892, "percentage": 73.06, "elapsed_time": "14:17:37", "remaining_time": "5:16:14"}
|
99 |
+
{"current_steps": 970, "total_steps": 1314, "loss": 0.5814, "learning_rate": 1.292190360393788e-06, "epoch": 2.211965811965812, "percentage": 73.82, "elapsed_time": "14:26:21", "remaining_time": "5:07:14"}
|
100 |
+
{"current_steps": 980, "total_steps": 1314, "loss": 0.5711, "learning_rate": 1.2495139405426606e-06, "epoch": 2.234757834757835, "percentage": 74.58, "elapsed_time": "14:35:06", "remaining_time": "4:58:15"}
|
101 |
+
{"current_steps": 990, "total_steps": 1314, "loss": 0.58, "learning_rate": 1.2077882997461603e-06, "epoch": 2.2575498575498574, "percentage": 75.34, "elapsed_time": "14:43:52", "remaining_time": "4:49:16"}
|
102 |
+
{"current_steps": 1000, "total_steps": 1314, "loss": 0.5801, "learning_rate": 1.1670398773471007e-06, "epoch": 2.2803418803418802, "percentage": 76.1, "elapsed_time": "14:52:38", "remaining_time": "4:40:17"}
|
103 |
+
{"current_steps": 1010, "total_steps": 1314, "loss": 0.5777, "learning_rate": 1.1272944934764177e-06, "epoch": 2.303133903133903, "percentage": 76.86, "elapsed_time": "15:01:22", "remaining_time": "4:31:18"}
|
104 |
+
{"current_steps": 1020, "total_steps": 1314, "loss": 0.5806, "learning_rate": 1.0885773326923188e-06, "epoch": 2.325925925925926, "percentage": 77.63, "elapsed_time": "15:10:07", "remaining_time": "4:22:19"}
|
105 |
+
{"current_steps": 1030, "total_steps": 1314, "loss": 0.582, "learning_rate": 1.0509129280221493e-06, "epoch": 2.348717948717949, "percentage": 78.39, "elapsed_time": "15:18:53", "remaining_time": "4:13:21"}
|
106 |
+
{"current_steps": 1040, "total_steps": 1314, "loss": 0.5797, "learning_rate": 1.0143251454171064e-06, "epoch": 2.3715099715099717, "percentage": 79.15, "elapsed_time": "15:27:37", "remaining_time": "4:04:23"}
|
107 |
+
{"current_steps": 1050, "total_steps": 1314, "loss": 0.5791, "learning_rate": 9.788371686296375e-07, "epoch": 2.394301994301994, "percentage": 79.91, "elapsed_time": "15:36:22", "remaining_time": "3:55:25"}
|
108 |
+
{"current_steps": 1060, "total_steps": 1314, "loss": 0.5871, "learning_rate": 9.444714845231223e-07, "epoch": 2.417094017094017, "percentage": 80.67, "elapsed_time": "15:45:06", "remaining_time": "3:46:28"}
|
109 |
+
{"current_steps": 1070, "total_steps": 1314, "loss": 0.5903, "learning_rate": 9.112498688231268e-07, "epoch": 2.43988603988604, "percentage": 81.43, "elapsed_time": "15:53:52", "remaining_time": "3:37:31"}
|
110 |
+
{"current_steps": 1080, "total_steps": 1314, "loss": 0.5855, "learning_rate": 8.791933723192731e-07, "epoch": 2.4626780626780627, "percentage": 82.19, "elapsed_time": "16:02:38", "remaining_time": "3:28:34"}
|
111 |
+
{"current_steps": 1090, "total_steps": 1314, "loss": 0.5829, "learning_rate": 8.483223075264621e-07, "epoch": 2.4854700854700855, "percentage": 82.95, "elapsed_time": "16:11:24", "remaining_time": "3:19:37"}
|
112 |
+
{"current_steps": 1100, "total_steps": 1314, "loss": 0.5895, "learning_rate": 8.186562358138997e-07, "epoch": 2.5082621082621084, "percentage": 83.71, "elapsed_time": "16:20:10", "remaining_time": "3:10:41"}
|
113 |
+
{"current_steps": 1110, "total_steps": 1314, "loss": 0.5824, "learning_rate": 7.902139550100899e-07, "epoch": 2.5310541310541312, "percentage": 84.47, "elapsed_time": "16:28:56", "remaining_time": "3:01:45"}
|
114 |
+
{"current_steps": 1120, "total_steps": 1314, "loss": 0.5808, "learning_rate": 7.630134874916379e-07, "epoch": 2.5538461538461537, "percentage": 85.24, "elapsed_time": "16:37:41", "remaining_time": "2:52:48"}
|
115 |
+
{"current_steps": 1130, "total_steps": 1314, "loss": 0.5801, "learning_rate": 7.370720687634186e-07, "epoch": 2.5766381766381765, "percentage": 86.0, "elapsed_time": "16:46:27", "remaining_time": "2:43:53"}
|
116 |
+
{"current_steps": 1140, "total_steps": 1314, "loss": 0.5797, "learning_rate": 7.124061365373441e-07, "epoch": 2.5994301994301994, "percentage": 86.76, "elapsed_time": "16:55:13", "remaining_time": "2:34:57"}
|
117 |
+
{"current_steps": 1150, "total_steps": 1314, "loss": 0.5799, "learning_rate": 6.890313203166517e-07, "epoch": 2.6222222222222222, "percentage": 87.52, "elapsed_time": "17:03:58", "remaining_time": "2:26:01"}
|
118 |
+
{"current_steps": 1160, "total_steps": 1314, "loss": 0.5807, "learning_rate": 6.669624314923094e-07, "epoch": 2.645014245014245, "percentage": 88.28, "elapsed_time": "17:12:45", "remaining_time": "2:17:06"}
|
119 |
+
{"current_steps": 1170, "total_steps": 1314, "loss": 0.5839, "learning_rate": 6.462134539578169e-07, "epoch": 2.667806267806268, "percentage": 89.04, "elapsed_time": "17:21:31", "remaining_time": "2:08:11"}
|
120 |
+
{"current_steps": 1180, "total_steps": 1314, "loss": 0.5789, "learning_rate": 6.267975352483476e-07, "epoch": 2.690598290598291, "percentage": 89.8, "elapsed_time": "17:30:17", "remaining_time": "1:59:16"}
|
121 |
+
{"current_steps": 1190, "total_steps": 1314, "loss": 0.5798, "learning_rate": 6.087269782098488e-07, "epoch": 2.7133903133903132, "percentage": 90.56, "elapsed_time": "17:39:03", "remaining_time": "1:50:21"}
|
122 |
+
{"current_steps": 1200, "total_steps": 1314, "loss": 0.583, "learning_rate": 5.920132332033751e-07, "epoch": 2.736182336182336, "percentage": 91.32, "elapsed_time": "17:47:49", "remaining_time": "1:41:26"}
|
123 |
+
{"current_steps": 1210, "total_steps": 1314, "loss": 0.5863, "learning_rate": 5.766668908495966e-07, "epoch": 2.758974358974359, "percentage": 92.09, "elapsed_time": "17:56:36", "remaining_time": "1:32:32"}
|
124 |
+
{"current_steps": 1220, "total_steps": 1314, "loss": 0.576, "learning_rate": 5.626976753180799e-07, "epoch": 2.781766381766382, "percentage": 92.85, "elapsed_time": "18:05:23", "remaining_time": "1:23:37"}
|
125 |
+
{"current_steps": 1230, "total_steps": 1314, "loss": 0.5746, "learning_rate": 5.501144381655945e-07, "epoch": 2.8045584045584047, "percentage": 93.61, "elapsed_time": "18:14:09", "remaining_time": "1:14:43"}
|
126 |
+
{"current_steps": 1240, "total_steps": 1314, "loss": 0.5894, "learning_rate": 5.389251527273468e-07, "epoch": 2.827350427350427, "percentage": 94.37, "elapsed_time": "18:22:55", "remaining_time": "1:05:49"}
|
127 |
+
{"current_steps": 1250, "total_steps": 1314, "loss": 0.5863, "learning_rate": 5.291369090646962e-07, "epoch": 2.8501424501424504, "percentage": 95.13, "elapsed_time": "18:31:41", "remaining_time": "0:56:55"}
|
128 |
+
{"current_steps": 1260, "total_steps": 1314, "loss": 0.5834, "learning_rate": 5.207559094725573e-07, "epoch": 2.872934472934473, "percentage": 95.89, "elapsed_time": "18:40:27", "remaining_time": "0:48:01"}
|
129 |
+
{"current_steps": 1270, "total_steps": 1314, "loss": 0.5843, "learning_rate": 5.137874645493318e-07, "epoch": 2.8957264957264957, "percentage": 96.65, "elapsed_time": "18:49:13", "remaining_time": "0:39:07"}
|
130 |
+
{"current_steps": 1280, "total_steps": 1314, "loss": 0.5745, "learning_rate": 5.082359898318615e-07, "epoch": 2.9185185185185185, "percentage": 97.41, "elapsed_time": "18:57:59", "remaining_time": "0:30:13"}
|
131 |
+
{"current_steps": 1290, "total_steps": 1314, "loss": 0.5744, "learning_rate": 5.041050029975357e-07, "epoch": 2.9413105413105414, "percentage": 98.17, "elapsed_time": "19:06:45", "remaining_time": "0:21:20"}
|
132 |
+
{"current_steps": 1300, "total_steps": 1314, "loss": 0.5756, "learning_rate": 5.013971216353229e-07, "epoch": 2.9641025641025642, "percentage": 98.93, "elapsed_time": "19:15:32", "remaining_time": "0:12:26"}
|
133 |
+
{"current_steps": 1310, "total_steps": 1314, "loss": 0.5858, "learning_rate": 5.001140615871431e-07, "epoch": 2.9868945868945866, "percentage": 99.7, "elapsed_time": "19:24:18", "remaining_time": "0:03:33"}
|