{"current_steps": 5, "total_steps": 183, "loss": 5.8337, "learning_rate": 1.997617272301248e-05, "epoch": 0.08080808080808081, "percentage": 2.73, "elapsed_time": "0:02:10", "remaining_time": "1:17:10", "throughput": 1269.36, "total_tokens": 165120} {"current_steps": 10, "total_steps": 183, "loss": 5.3632, "learning_rate": 1.9879568983287468e-05, "epoch": 0.16161616161616163, "percentage": 5.46, "elapsed_time": "0:04:19", "remaining_time": "1:14:57", "throughput": 1270.37, "total_tokens": 330240} {"current_steps": 15, "total_steps": 183, "loss": 4.0589, "learning_rate": 1.9709418174260523e-05, "epoch": 0.24242424242424243, "percentage": 8.2, "elapsed_time": "0:06:29", "remaining_time": "1:12:45", "throughput": 1270.95, "total_tokens": 495360} {"current_steps": 20, "total_steps": 183, "loss": 2.4357, "learning_rate": 1.9466986959828063e-05, "epoch": 0.32323232323232326, "percentage": 10.93, "elapsed_time": "0:08:39", "remaining_time": "1:10:34", "throughput": 1271.3, "total_tokens": 660480} {"current_steps": 25, "total_steps": 183, "loss": 0.9083, "learning_rate": 1.9154080085253665e-05, "epoch": 0.40404040404040403, "percentage": 13.66, "elapsed_time": "0:10:49", "remaining_time": "1:08:23", "throughput": 1271.65, "total_tokens": 825600} {"current_steps": 30, "total_steps": 183, "loss": 0.3938, "learning_rate": 1.877302694199442e-05, "epoch": 0.48484848484848486, "percentage": 16.39, "elapsed_time": "0:12:59", "remaining_time": "1:06:13", "throughput": 1271.48, "total_tokens": 990720} {"current_steps": 35, "total_steps": 183, "loss": 0.0899, "learning_rate": 1.8326664226872063e-05, "epoch": 0.5656565656565656, "percentage": 19.13, "elapsed_time": "0:15:08", "remaining_time": "1:04:03", "throughput": 1271.57, "total_tokens": 1155840} {"current_steps": 40, "total_steps": 183, "loss": 0.146, "learning_rate": 1.78183148246803e-05, "epoch": 0.6464646464646465, "percentage": 21.86, "elapsed_time": "0:17:18", "remaining_time": "1:01:53", "throughput": 1271.62, "total_tokens": 1320960} {"current_steps": 45, "total_steps": 183, "loss": 0.0063, "learning_rate": 1.7251763071433767e-05, "epoch": 0.7272727272727273, "percentage": 24.59, "elapsed_time": "0:19:28", "remaining_time": "0:59:43", "throughput": 1271.67, "total_tokens": 1486080} {"current_steps": 50, "total_steps": 183, "loss": 0.0044, "learning_rate": 1.6631226582407954e-05, "epoch": 0.8080808080808081, "percentage": 27.32, "elapsed_time": "0:21:38", "remaining_time": "0:57:33", "throughput": 1271.67, "total_tokens": 1651200} {"current_steps": 55, "total_steps": 183, "loss": 0.1276, "learning_rate": 1.5961324854692254e-05, "epoch": 0.8888888888888888, "percentage": 30.05, "elapsed_time": "0:23:48", "remaining_time": "0:55:24", "throughput": 1271.68, "total_tokens": 1816320} {"current_steps": 60, "total_steps": 183, "loss": 0.0009, "learning_rate": 1.524704487799008e-05, "epoch": 0.9696969696969697, "percentage": 32.79, "elapsed_time": "0:25:58", "remaining_time": "0:53:13", "throughput": 1271.77, "total_tokens": 1981440} {"current_steps": 65, "total_steps": 183, "loss": 0.0022, "learning_rate": 1.4493704009671614e-05, "epoch": 1.0505050505050506, "percentage": 35.52, "elapsed_time": "0:28:07", "remaining_time": "0:51:04", "throughput": 1271.8, "total_tokens": 2146560} {"current_steps": 70, "total_steps": 183, "loss": 0.0003, "learning_rate": 1.3706910390450679e-05, "epoch": 1.1313131313131313, "percentage": 38.25, "elapsed_time": "0:30:17", "remaining_time": "0:48:54", "throughput": 1271.81, "total_tokens": 2311680} {"current_steps": 75, "total_steps": 183, "loss": 0.0011, "learning_rate": 1.2892521195365679e-05, "epoch": 1.2121212121212122, "percentage": 40.98, "elapsed_time": "0:32:27", "remaining_time": "0:46:44", "throughput": 1271.85, "total_tokens": 2476800} {"current_steps": 80, "total_steps": 183, "loss": 0.0002, "learning_rate": 1.2056599030859367e-05, "epoch": 1.2929292929292928, "percentage": 43.72, "elapsed_time": "0:34:37", "remaining_time": "0:44:34", "throughput": 1271.91, "total_tokens": 2641920} {"current_steps": 85, "total_steps": 183, "loss": 0.0006, "learning_rate": 1.1205366802553231e-05, "epoch": 1.3737373737373737, "percentage": 46.45, "elapsed_time": "0:36:46", "remaining_time": "0:42:24", "throughput": 1271.96, "total_tokens": 2807040} {"current_steps": 90, "total_steps": 183, "loss": 0.0002, "learning_rate": 1.0345161389697083e-05, "epoch": 1.4545454545454546, "percentage": 49.18, "elapsed_time": "0:38:56", "remaining_time": "0:40:14", "throughput": 1272.0, "total_tokens": 2972160} {"current_steps": 95, "total_steps": 183, "loss": 0.0098, "learning_rate": 9.482386471157905e-06, "epoch": 1.5353535353535355, "percentage": 51.91, "elapsed_time": "0:41:06", "remaining_time": "0:38:04", "throughput": 1272.08, "total_tokens": 3137280} {"current_steps": 100, "total_steps": 183, "loss": 0.0006, "learning_rate": 8.62346485412832e-06, "epoch": 1.6161616161616161, "percentage": 54.64, "elapsed_time": "0:43:15", "remaining_time": "0:35:54", "throughput": 1272.11, "total_tokens": 3302400} {"current_steps": 100, "total_steps": 183, "eval_loss": 0.00015967342187650502, "epoch": 1.6161616161616161, "percentage": 54.64, "elapsed_time": "0:43:21", "remaining_time": "0:35:59", "throughput": 1269.55, "total_tokens": 3302400} {"current_steps": 105, "total_steps": 183, "loss": 0.0002, "learning_rate": 7.774790660436857e-06, "epoch": 1.696969696969697, "percentage": 57.38, "elapsed_time": "0:45:32", "remaining_time": "0:33:49", "throughput": 1269.17, "total_tokens": 3467520} {"current_steps": 110, "total_steps": 183, "loss": 0.0002, "learning_rate": 6.942681726402474e-06, "epoch": 1.7777777777777777, "percentage": 60.11, "elapsed_time": "0:47:41", "remaining_time": "0:31:39", "throughput": 1269.35, "total_tokens": 3632640} {"current_steps": 115, "total_steps": 183, "loss": 0.0924, "learning_rate": 6.133332570585813e-06, "epoch": 1.8585858585858586, "percentage": 62.84, "elapsed_time": "0:49:51", "remaining_time": "0:29:28", "throughput": 1269.47, "total_tokens": 3797760} {"current_steps": 120, "total_steps": 183, "loss": 0.0002, "learning_rate": 5.352768279562315e-06, "epoch": 1.9393939393939394, "percentage": 65.57, "elapsed_time": "0:52:01", "remaining_time": "0:27:18", "throughput": 1269.54, "total_tokens": 3962880} {"current_steps": 125, "total_steps": 183, "loss": 0.0002, "learning_rate": 4.606799655008009e-06, "epoch": 2.0202020202020203, "percentage": 68.31, "elapsed_time": "0:54:11", "remaining_time": "0:25:08", "throughput": 1269.67, "total_tokens": 4128000} {"current_steps": 130, "total_steps": 183, "loss": 0.0004, "learning_rate": 3.900979955999271e-06, "epoch": 2.101010101010101, "percentage": 71.04, "elapsed_time": "0:56:21", "remaining_time": "0:22:58", "throughput": 1269.75, "total_tokens": 4293120} {"current_steps": 135, "total_steps": 183, "loss": 0.0001, "learning_rate": 3.2405635585524566e-06, "epoch": 2.1818181818181817, "percentage": 73.77, "elapsed_time": "0:58:30", "remaining_time": "0:20:48", "throughput": 1269.91, "total_tokens": 4458240} {"current_steps": 140, "total_steps": 183, "loss": 0.0876, "learning_rate": 2.6304668401566334e-06, "epoch": 2.2626262626262625, "percentage": 76.5, "elapsed_time": "1:00:40", "remaining_time": "0:18:38", "throughput": 1270.03, "total_tokens": 4623360} {"current_steps": 145, "total_steps": 183, "loss": 0.0005, "learning_rate": 2.075231580489098e-06, "epoch": 2.3434343434343434, "percentage": 79.23, "elapsed_time": "1:02:49", "remaining_time": "0:16:27", "throughput": 1270.16, "total_tokens": 4788480} {"current_steps": 150, "total_steps": 183, "loss": 0.0686, "learning_rate": 1.5789911507718824e-06, "epoch": 2.4242424242424243, "percentage": 81.97, "elapsed_time": "1:04:59", "remaining_time": "0:14:17", "throughput": 1270.23, "total_tokens": 4953600} {"current_steps": 155, "total_steps": 183, "loss": 0.0001, "learning_rate": 1.1454397434679022e-06, "epoch": 2.505050505050505, "percentage": 84.7, "elapsed_time": "1:07:09", "remaining_time": "0:12:07", "throughput": 1270.28, "total_tokens": 5118720} {"current_steps": 160, "total_steps": 183, "loss": 0.0003, "learning_rate": 7.778048713818975e-07, "epoch": 2.5858585858585856, "percentage": 87.43, "elapsed_time": "1:09:19", "remaining_time": "0:09:57", "throughput": 1270.36, "total_tokens": 5283840} {"current_steps": 165, "total_steps": 183, "loss": 0.0006, "learning_rate": 4.788233408928588e-07, "epoch": 2.6666666666666665, "percentage": 90.16, "elapsed_time": "1:11:29", "remaining_time": "0:07:47", "throughput": 1270.45, "total_tokens": 5448960} {"current_steps": 170, "total_steps": 183, "loss": 0.0003, "learning_rate": 2.507208781817638e-07, "epoch": 2.7474747474747474, "percentage": 92.9, "elapsed_time": "1:13:38", "remaining_time": "0:05:37", "throughput": 1270.54, "total_tokens": 5614080} {"current_steps": 175, "total_steps": 183, "loss": 0.0001, "learning_rate": 9.519556012436815e-08, "epoch": 2.8282828282828283, "percentage": 95.63, "elapsed_time": "1:15:48", "remaining_time": "0:03:27", "throughput": 1270.59, "total_tokens": 5779200} {"current_steps": 180, "total_steps": 183, "loss": 0.0002, "learning_rate": 1.340517319543877e-08, "epoch": 2.909090909090909, "percentage": 98.36, "elapsed_time": "1:17:58", "remaining_time": "0:01:17", "throughput": 1270.64, "total_tokens": 5944320} {"current_steps": 183, "total_steps": 183, "epoch": 2.9575757575757575, "percentage": 100.0, "elapsed_time": "1:19:17", "remaining_time": "0:00:00", "throughput": 1270.39, "total_tokens": 6043392}