Mistral-7b-uncensored-sft-lora / trainer_log.jsonl
jdqqjr's picture
init
00e6106
{"current_steps": 10, "total_steps": 1352, "loss": 0.6972, "learning_rate": 9.998650208062712e-05, "epoch": 0.059084194977843424, "percentage": 0.74, "elapsed_time": "0:02:55", "remaining_time": "6:31:38"}
{"current_steps": 20, "total_steps": 1352, "loss": 0.5423, "learning_rate": 9.994601561026155e-05, "epoch": 0.11816838995568685, "percentage": 1.48, "elapsed_time": "0:05:43", "remaining_time": "6:21:30"}
{"current_steps": 30, "total_steps": 1352, "loss": 0.5149, "learning_rate": 9.98785624482278e-05, "epoch": 0.17725258493353027, "percentage": 2.22, "elapsed_time": "0:08:36", "remaining_time": "6:18:58"}
{"current_steps": 40, "total_steps": 1352, "loss": 0.513, "learning_rate": 9.978417901361958e-05, "epoch": 0.2363367799113737, "percentage": 2.96, "elapsed_time": "0:11:26", "remaining_time": "6:15:08"}
{"current_steps": 50, "total_steps": 1352, "loss": 0.4957, "learning_rate": 9.96629162656365e-05, "epoch": 0.29542097488921715, "percentage": 3.7, "elapsed_time": "0:14:14", "remaining_time": "6:10:46"}
{"current_steps": 60, "total_steps": 1352, "loss": 0.495, "learning_rate": 9.951483967607041e-05, "epoch": 0.35450516986706054, "percentage": 4.44, "elapsed_time": "0:17:01", "remaining_time": "6:06:31"}
{"current_steps": 70, "total_steps": 1352, "loss": 0.4943, "learning_rate": 9.934002919395592e-05, "epoch": 0.413589364844904, "percentage": 5.18, "elapsed_time": "0:19:47", "remaining_time": "6:02:28"}
{"current_steps": 80, "total_steps": 1352, "loss": 0.4738, "learning_rate": 9.91385792024048e-05, "epoch": 0.4726735598227474, "percentage": 5.92, "elapsed_time": "0:22:37", "remaining_time": "5:59:41"}
{"current_steps": 90, "total_steps": 1352, "loss": 0.4565, "learning_rate": 9.891059846764679e-05, "epoch": 0.5317577548005908, "percentage": 6.66, "elapsed_time": "0:25:27", "remaining_time": "5:56:54"}
{"current_steps": 100, "total_steps": 1352, "loss": 0.4674, "learning_rate": 9.865621008030492e-05, "epoch": 0.5908419497784343, "percentage": 7.4, "elapsed_time": "0:28:13", "remaining_time": "5:53:22"}
{"current_steps": 110, "total_steps": 1352, "loss": 0.4727, "learning_rate": 9.83755513889369e-05, "epoch": 0.6499261447562777, "percentage": 8.14, "elapsed_time": "0:31:02", "remaining_time": "5:50:31"}
{"current_steps": 120, "total_steps": 1352, "loss": 0.4736, "learning_rate": 9.80687739258782e-05, "epoch": 0.7090103397341211, "percentage": 8.88, "elapsed_time": "0:33:49", "remaining_time": "5:47:18"}
{"current_steps": 130, "total_steps": 1352, "loss": 0.47, "learning_rate": 9.773604332542729e-05, "epoch": 0.7680945347119645, "percentage": 9.62, "elapsed_time": "0:36:36", "remaining_time": "5:44:02"}
{"current_steps": 140, "total_steps": 1352, "loss": 0.467, "learning_rate": 9.737753923441688e-05, "epoch": 0.827178729689808, "percentage": 10.36, "elapsed_time": "0:39:26", "remaining_time": "5:41:26"}
{"current_steps": 150, "total_steps": 1352, "loss": 0.4522, "learning_rate": 9.69934552152196e-05, "epoch": 0.8862629246676514, "percentage": 11.09, "elapsed_time": "0:42:15", "remaining_time": "5:38:37"}
{"current_steps": 160, "total_steps": 1352, "loss": 0.4613, "learning_rate": 9.658399864124037e-05, "epoch": 0.9453471196454948, "percentage": 11.83, "elapsed_time": "0:45:01", "remaining_time": "5:35:24"}
{"current_steps": 170, "total_steps": 1352, "loss": 0.4641, "learning_rate": 9.61493905849521e-05, "epoch": 1.0044313146233383, "percentage": 12.57, "elapsed_time": "0:47:48", "remaining_time": "5:32:25"}
{"current_steps": 180, "total_steps": 1352, "loss": 0.3946, "learning_rate": 9.568986569853487e-05, "epoch": 1.0635155096011817, "percentage": 13.31, "elapsed_time": "0:50:42", "remaining_time": "5:30:07"}
{"current_steps": 190, "total_steps": 1352, "loss": 0.3882, "learning_rate": 9.520567208718337e-05, "epoch": 1.122599704579025, "percentage": 14.05, "elapsed_time": "0:53:31", "remaining_time": "5:27:20"}
{"current_steps": 200, "total_steps": 1352, "loss": 0.4205, "learning_rate": 9.469707117515067e-05, "epoch": 1.1816838995568686, "percentage": 14.79, "elapsed_time": "0:56:16", "remaining_time": "5:24:07"}
{"current_steps": 210, "total_steps": 1352, "loss": 0.386, "learning_rate": 9.416433756460091e-05, "epoch": 1.240768094534712, "percentage": 15.53, "elapsed_time": "0:59:03", "remaining_time": "5:21:09"}
{"current_steps": 220, "total_steps": 1352, "loss": 0.4096, "learning_rate": 9.360775888734698e-05, "epoch": 1.2998522895125553, "percentage": 16.27, "elapsed_time": "1:01:50", "remaining_time": "5:18:10"}
{"current_steps": 230, "total_steps": 1352, "loss": 0.3921, "learning_rate": 9.302763564955331e-05, "epoch": 1.3589364844903988, "percentage": 17.01, "elapsed_time": "1:04:39", "remaining_time": "5:15:23"}
{"current_steps": 240, "total_steps": 1352, "loss": 0.3788, "learning_rate": 9.242428106948749e-05, "epoch": 1.4180206794682422, "percentage": 17.75, "elapsed_time": "1:07:30", "remaining_time": "5:12:45"}
{"current_steps": 250, "total_steps": 1352, "loss": 0.3894, "learning_rate": 9.179802090840853e-05, "epoch": 1.4771048744460857, "percentage": 18.49, "elapsed_time": "1:10:19", "remaining_time": "5:09:59"}
{"current_steps": 260, "total_steps": 1352, "loss": 0.3707, "learning_rate": 9.114919329468282e-05, "epoch": 1.536189069423929, "percentage": 19.23, "elapsed_time": "1:13:12", "remaining_time": "5:07:27"}
{"current_steps": 270, "total_steps": 1352, "loss": 0.3938, "learning_rate": 9.04781485412231e-05, "epoch": 1.5952732644017726, "percentage": 19.97, "elapsed_time": "1:15:55", "remaining_time": "5:04:16"}
{"current_steps": 280, "total_steps": 1352, "loss": 0.3799, "learning_rate": 8.978524895634842e-05, "epoch": 1.654357459379616, "percentage": 20.71, "elapsed_time": "1:18:46", "remaining_time": "5:01:35"}
{"current_steps": 290, "total_steps": 1352, "loss": 0.403, "learning_rate": 8.907086864816803e-05, "epoch": 1.7134416543574593, "percentage": 21.45, "elapsed_time": "1:21:33", "remaining_time": "4:58:40"}
{"current_steps": 300, "total_steps": 1352, "loss": 0.3758, "learning_rate": 8.833539332259398e-05, "epoch": 1.7725258493353029, "percentage": 22.19, "elapsed_time": "1:24:28", "remaining_time": "4:56:12"}
{"current_steps": 310, "total_steps": 1352, "loss": 0.3963, "learning_rate": 8.757922007509207e-05, "epoch": 1.8316100443131462, "percentage": 22.93, "elapsed_time": "1:27:16", "remaining_time": "4:53:23"}
{"current_steps": 320, "total_steps": 1352, "loss": 0.3858, "learning_rate": 8.680275717628337e-05, "epoch": 1.8906942392909896, "percentage": 23.67, "elapsed_time": "1:30:06", "remaining_time": "4:50:35"}
{"current_steps": 330, "total_steps": 1352, "loss": 0.3799, "learning_rate": 8.600642385151205e-05, "epoch": 1.9497784342688331, "percentage": 24.41, "elapsed_time": "1:32:52", "remaining_time": "4:47:37"}
{"current_steps": 340, "total_steps": 1352, "loss": 0.3763, "learning_rate": 8.519065005449858e-05, "epoch": 2.0088626292466767, "percentage": 25.15, "elapsed_time": "1:35:37", "remaining_time": "4:44:37"}
{"current_steps": 350, "total_steps": 1352, "loss": 0.2934, "learning_rate": 8.43558762352005e-05, "epoch": 2.06794682422452, "percentage": 25.89, "elapsed_time": "1:38:32", "remaining_time": "4:42:05"}
{"current_steps": 360, "total_steps": 1352, "loss": 0.3078, "learning_rate": 8.350255310200612e-05, "epoch": 2.1270310192023634, "percentage": 26.63, "elapsed_time": "1:41:15", "remaining_time": "4:39:01"}
{"current_steps": 370, "total_steps": 1352, "loss": 0.3028, "learning_rate": 8.263114137838947e-05, "epoch": 2.186115214180207, "percentage": 27.37, "elapsed_time": "1:44:01", "remaining_time": "4:36:06"}
{"current_steps": 380, "total_steps": 1352, "loss": 0.2972, "learning_rate": 8.174211155415799e-05, "epoch": 2.24519940915805, "percentage": 28.11, "elapsed_time": "1:46:47", "remaining_time": "4:33:09"}
{"current_steps": 390, "total_steps": 1352, "loss": 0.2995, "learning_rate": 8.083594363142717e-05, "epoch": 2.3042836041358936, "percentage": 28.85, "elapsed_time": "1:49:35", "remaining_time": "4:30:18"}
{"current_steps": 400, "total_steps": 1352, "loss": 0.2963, "learning_rate": 7.991312686545937e-05, "epoch": 2.363367799113737, "percentage": 29.59, "elapsed_time": "1:52:24", "remaining_time": "4:27:32"}
{"current_steps": 410, "total_steps": 1352, "loss": 0.2987, "learning_rate": 7.897415950050676e-05, "epoch": 2.4224519940915803, "percentage": 30.33, "elapsed_time": "1:55:12", "remaining_time": "4:24:40"}
{"current_steps": 420, "total_steps": 1352, "loss": 0.3092, "learning_rate": 7.801954850080075e-05, "epoch": 2.481536189069424, "percentage": 31.07, "elapsed_time": "1:57:55", "remaining_time": "4:21:41"}
{"current_steps": 430, "total_steps": 1352, "loss": 0.2951, "learning_rate": 7.704980927683359e-05, "epoch": 2.5406203840472674, "percentage": 31.8, "elapsed_time": "2:00:50", "remaining_time": "4:19:05"}
{"current_steps": 440, "total_steps": 1352, "loss": 0.3097, "learning_rate": 7.60654654070796e-05, "epoch": 2.5997045790251105, "percentage": 32.54, "elapsed_time": "2:03:35", "remaining_time": "4:16:10"}
{"current_steps": 450, "total_steps": 1352, "loss": 0.2999, "learning_rate": 7.506704835530634e-05, "epoch": 2.658788774002954, "percentage": 33.28, "elapsed_time": "2:06:27", "remaining_time": "4:13:28"}
{"current_steps": 460, "total_steps": 1352, "loss": 0.2905, "learning_rate": 7.405509718362842e-05, "epoch": 2.7178729689807977, "percentage": 34.02, "elapsed_time": "2:09:15", "remaining_time": "4:10:37"}
{"current_steps": 470, "total_steps": 1352, "loss": 0.309, "learning_rate": 7.303015826145885e-05, "epoch": 2.7769571639586412, "percentage": 34.76, "elapsed_time": "2:12:01", "remaining_time": "4:07:45"}
{"current_steps": 480, "total_steps": 1352, "loss": 0.302, "learning_rate": 7.199278497051498e-05, "epoch": 2.8360413589364843, "percentage": 35.5, "elapsed_time": "2:14:51", "remaining_time": "4:05:00"}
{"current_steps": 490, "total_steps": 1352, "loss": 0.297, "learning_rate": 7.094353740603839e-05, "epoch": 2.895125553914328, "percentage": 36.24, "elapsed_time": "2:17:38", "remaining_time": "4:02:07"}
{"current_steps": 500, "total_steps": 1352, "loss": 0.3101, "learning_rate": 6.988298207439021e-05, "epoch": 2.9542097488921715, "percentage": 36.98, "elapsed_time": "2:20:26", "remaining_time": "3:59:18"}
{"current_steps": 500, "total_steps": 1352, "eval_loss": 0.4939613938331604, "epoch": 2.9542097488921715, "percentage": 36.98, "elapsed_time": "2:21:20", "remaining_time": "4:00:49"}
{"current_steps": 510, "total_steps": 1352, "loss": 0.2736, "learning_rate": 6.881169158718474e-05, "epoch": 3.0132939438700146, "percentage": 37.72, "elapsed_time": "2:24:11", "remaining_time": "3:58:03"}
{"current_steps": 520, "total_steps": 1352, "loss": 0.2187, "learning_rate": 6.773024435212678e-05, "epoch": 3.072378138847858, "percentage": 38.46, "elapsed_time": "2:26:58", "remaining_time": "3:55:10"}
{"current_steps": 530, "total_steps": 1352, "loss": 0.2057, "learning_rate": 6.663922426071977e-05, "epoch": 3.1314623338257017, "percentage": 39.2, "elapsed_time": "2:29:45", "remaining_time": "3:52:15"}
{"current_steps": 540, "total_steps": 1352, "loss": 0.2067, "learning_rate": 6.553922037301283e-05, "epoch": 3.1905465288035453, "percentage": 39.94, "elapsed_time": "2:32:39", "remaining_time": "3:49:32"}
{"current_steps": 550, "total_steps": 1352, "loss": 0.1989, "learning_rate": 6.443082659955738e-05, "epoch": 3.2496307237813884, "percentage": 40.68, "elapsed_time": "2:35:33", "remaining_time": "3:46:49"}
{"current_steps": 560, "total_steps": 1352, "loss": 0.2179, "learning_rate": 6.331464138074493e-05, "epoch": 3.308714918759232, "percentage": 41.42, "elapsed_time": "2:38:17", "remaining_time": "3:43:52"}
{"current_steps": 570, "total_steps": 1352, "loss": 0.2176, "learning_rate": 6.219126736369903e-05, "epoch": 3.3677991137370755, "percentage": 42.16, "elapsed_time": "2:41:06", "remaining_time": "3:41:01"}
{"current_steps": 580, "total_steps": 1352, "loss": 0.2215, "learning_rate": 6.106131107689599e-05, "epoch": 3.4268833087149186, "percentage": 42.9, "elapsed_time": "2:43:52", "remaining_time": "3:38:06"}
{"current_steps": 590, "total_steps": 1352, "loss": 0.2153, "learning_rate": 5.9925382602689974e-05, "epoch": 3.485967503692762, "percentage": 43.64, "elapsed_time": "2:46:38", "remaining_time": "3:35:13"}
{"current_steps": 600, "total_steps": 1352, "loss": 0.2133, "learning_rate": 5.8784095247919305e-05, "epoch": 3.5450516986706058, "percentage": 44.38, "elapsed_time": "2:49:26", "remaining_time": "3:32:21"}
{"current_steps": 610, "total_steps": 1352, "loss": 0.2109, "learning_rate": 5.763806521277184e-05, "epoch": 3.604135893648449, "percentage": 45.12, "elapsed_time": "2:52:16", "remaining_time": "3:29:32"}
{"current_steps": 620, "total_steps": 1352, "loss": 0.2214, "learning_rate": 5.648791125808809e-05, "epoch": 3.6632200886262924, "percentage": 45.86, "elapsed_time": "2:55:02", "remaining_time": "3:26:39"}
{"current_steps": 630, "total_steps": 1352, "loss": 0.212, "learning_rate": 5.5334254371281934e-05, "epoch": 3.722304283604136, "percentage": 46.6, "elapsed_time": "2:57:52", "remaining_time": "3:23:51"}
{"current_steps": 640, "total_steps": 1352, "loss": 0.2196, "learning_rate": 5.417771743105907e-05, "epoch": 3.781388478581979, "percentage": 47.34, "elapsed_time": "3:00:45", "remaining_time": "3:21:05"}
{"current_steps": 650, "total_steps": 1352, "loss": 0.2145, "learning_rate": 5.3018924871114305e-05, "epoch": 3.8404726735598227, "percentage": 48.08, "elapsed_time": "3:03:33", "remaining_time": "3:18:14"}
{"current_steps": 660, "total_steps": 1352, "loss": 0.2199, "learning_rate": 5.185850234298942e-05, "epoch": 3.8995568685376663, "percentage": 48.82, "elapsed_time": "3:06:17", "remaining_time": "3:15:19"}
{"current_steps": 670, "total_steps": 1352, "loss": 0.218, "learning_rate": 5.0697076378273354e-05, "epoch": 3.9586410635155094, "percentage": 49.56, "elapsed_time": "3:09:04", "remaining_time": "3:12:27"}
{"current_steps": 680, "total_steps": 1352, "loss": 0.1987, "learning_rate": 4.953527405032723e-05, "epoch": 4.017725258493353, "percentage": 50.3, "elapsed_time": "3:11:51", "remaining_time": "3:09:35"}
{"current_steps": 690, "total_steps": 1352, "loss": 0.1425, "learning_rate": 4.8373722635717086e-05, "epoch": 4.0768094534711965, "percentage": 51.04, "elapsed_time": "3:14:39", "remaining_time": "3:06:45"}
{"current_steps": 700, "total_steps": 1352, "loss": 0.1313, "learning_rate": 4.721304927553658e-05, "epoch": 4.13589364844904, "percentage": 51.78, "elapsed_time": "3:17:26", "remaining_time": "3:03:53"}
{"current_steps": 710, "total_steps": 1352, "loss": 0.1397, "learning_rate": 4.60538806368031e-05, "epoch": 4.194977843426884, "percentage": 52.51, "elapsed_time": "3:20:11", "remaining_time": "3:01:01"}
{"current_steps": 720, "total_steps": 1352, "loss": 0.1421, "learning_rate": 4.489684257410958e-05, "epoch": 4.254062038404727, "percentage": 53.25, "elapsed_time": "3:22:58", "remaining_time": "2:58:09"}
{"current_steps": 730, "total_steps": 1352, "loss": 0.1386, "learning_rate": 4.374255979171538e-05, "epoch": 4.31314623338257, "percentage": 53.99, "elapsed_time": "3:25:45", "remaining_time": "2:55:19"}
{"current_steps": 740, "total_steps": 1352, "loss": 0.1444, "learning_rate": 4.2591655506257645e-05, "epoch": 4.372230428360414, "percentage": 54.73, "elapsed_time": "3:28:35", "remaining_time": "2:52:30"}
{"current_steps": 750, "total_steps": 1352, "loss": 0.1391, "learning_rate": 4.144475111026643e-05, "epoch": 4.431314623338257, "percentage": 55.47, "elapsed_time": "3:31:25", "remaining_time": "2:49:42"}
{"current_steps": 760, "total_steps": 1352, "loss": 0.1438, "learning_rate": 4.030246583666437e-05, "epoch": 4.4903988183161, "percentage": 56.21, "elapsed_time": "3:34:15", "remaining_time": "2:46:53"}
{"current_steps": 770, "total_steps": 1352, "loss": 0.1415, "learning_rate": 3.9165416424432414e-05, "epoch": 4.549483013293944, "percentage": 56.95, "elapsed_time": "3:37:04", "remaining_time": "2:44:04"}
{"current_steps": 780, "total_steps": 1352, "loss": 0.1492, "learning_rate": 3.803421678562213e-05, "epoch": 4.608567208271787, "percentage": 57.69, "elapsed_time": "3:39:52", "remaining_time": "2:41:14"}
{"current_steps": 790, "total_steps": 1352, "loss": 0.1512, "learning_rate": 3.690947767389426e-05, "epoch": 4.66765140324963, "percentage": 58.43, "elapsed_time": "3:42:44", "remaining_time": "2:38:27"}
{"current_steps": 800, "total_steps": 1352, "loss": 0.1481, "learning_rate": 3.57918063547627e-05, "epoch": 4.726735598227474, "percentage": 59.17, "elapsed_time": "3:45:31", "remaining_time": "2:35:36"}
{"current_steps": 810, "total_steps": 1352, "loss": 0.1418, "learning_rate": 3.468180627772144e-05, "epoch": 4.7858197932053175, "percentage": 59.91, "elapsed_time": "3:48:15", "remaining_time": "2:32:44"}
{"current_steps": 820, "total_steps": 1352, "loss": 0.146, "learning_rate": 3.358007675043224e-05, "epoch": 4.844903988183161, "percentage": 60.65, "elapsed_time": "3:51:03", "remaining_time": "2:29:54"}
{"current_steps": 830, "total_steps": 1352, "loss": 0.1407, "learning_rate": 3.2487212615148316e-05, "epoch": 4.903988183161005, "percentage": 61.39, "elapsed_time": "3:53:49", "remaining_time": "2:27:03"}
{"current_steps": 840, "total_steps": 1352, "loss": 0.1502, "learning_rate": 3.1403803927549006e-05, "epoch": 4.963072378138848, "percentage": 62.13, "elapsed_time": "3:56:38", "remaining_time": "2:24:14"}
{"current_steps": 850, "total_steps": 1352, "loss": 0.1322, "learning_rate": 3.0330435638158806e-05, "epoch": 5.022156573116692, "percentage": 62.87, "elapsed_time": "3:59:24", "remaining_time": "2:21:23"}
{"current_steps": 860, "total_steps": 1352, "loss": 0.0985, "learning_rate": 2.9267687276522876e-05, "epoch": 5.081240768094535, "percentage": 63.61, "elapsed_time": "4:02:13", "remaining_time": "2:18:34"}
{"current_steps": 870, "total_steps": 1352, "loss": 0.0929, "learning_rate": 2.821613263830912e-05, "epoch": 5.140324963072378, "percentage": 64.35, "elapsed_time": "4:05:03", "remaining_time": "2:15:46"}
{"current_steps": 880, "total_steps": 1352, "loss": 0.0941, "learning_rate": 2.717633947550651e-05, "epoch": 5.199409158050222, "percentage": 65.09, "elapsed_time": "4:07:51", "remaining_time": "2:12:56"}
{"current_steps": 890, "total_steps": 1352, "loss": 0.0951, "learning_rate": 2.614886918988604e-05, "epoch": 5.258493353028065, "percentage": 65.83, "elapsed_time": "4:10:38", "remaining_time": "2:10:06"}
{"current_steps": 900, "total_steps": 1352, "loss": 0.0926, "learning_rate": 2.5134276529890644e-05, "epoch": 5.317577548005908, "percentage": 66.57, "elapsed_time": "4:13:26", "remaining_time": "2:07:17"}
{"current_steps": 910, "total_steps": 1352, "loss": 0.095, "learning_rate": 2.4133109291117156e-05, "epoch": 5.376661742983752, "percentage": 67.31, "elapsed_time": "4:16:14", "remaining_time": "2:04:27"}
{"current_steps": 920, "total_steps": 1352, "loss": 0.0886, "learning_rate": 2.314590802055232e-05, "epoch": 5.435745937961595, "percentage": 68.05, "elapsed_time": "4:18:58", "remaining_time": "2:01:36"}
{"current_steps": 930, "total_steps": 1352, "loss": 0.096, "learning_rate": 2.2173205724722318e-05, "epoch": 5.4948301329394384, "percentage": 68.79, "elapsed_time": "4:21:47", "remaining_time": "1:58:47"}
{"current_steps": 940, "total_steps": 1352, "loss": 0.0962, "learning_rate": 2.121552758191366e-05, "epoch": 5.5539143279172825, "percentage": 69.53, "elapsed_time": "4:24:31", "remaining_time": "1:55:56"}
{"current_steps": 950, "total_steps": 1352, "loss": 0.0985, "learning_rate": 2.027339065862064e-05, "epoch": 5.612998522895126, "percentage": 70.27, "elapsed_time": "4:27:16", "remaining_time": "1:53:05"}
{"current_steps": 960, "total_steps": 1352, "loss": 0.0939, "learning_rate": 1.934730363037237e-05, "epoch": 5.672082717872969, "percentage": 71.01, "elapsed_time": "4:30:02", "remaining_time": "1:50:16"}
{"current_steps": 970, "total_steps": 1352, "loss": 0.0975, "learning_rate": 1.843776650709046e-05, "epoch": 5.731166912850813, "percentage": 71.75, "elapsed_time": "4:32:47", "remaining_time": "1:47:25"}
{"current_steps": 980, "total_steps": 1352, "loss": 0.093, "learning_rate": 1.7545270363125153e-05, "epoch": 5.790251107828656, "percentage": 72.49, "elapsed_time": "4:35:33", "remaining_time": "1:44:35"}
{"current_steps": 990, "total_steps": 1352, "loss": 0.0959, "learning_rate": 1.6670297072116165e-05, "epoch": 5.849335302806499, "percentage": 73.22, "elapsed_time": "4:38:25", "remaining_time": "1:41:48"}
{"current_steps": 1000, "total_steps": 1352, "loss": 0.0918, "learning_rate": 1.581331904682089e-05, "epoch": 5.908419497784343, "percentage": 73.96, "elapsed_time": "4:41:09", "remaining_time": "1:38:58"}
{"current_steps": 1000, "total_steps": 1352, "eval_loss": 0.7311862707138062, "epoch": 5.908419497784343, "percentage": 73.96, "elapsed_time": "4:42:02", "remaining_time": "1:39:16"}
{"current_steps": 1010, "total_steps": 1352, "loss": 0.0933, "learning_rate": 1.4974798984050942e-05, "epoch": 5.967503692762186, "percentage": 74.7, "elapsed_time": "4:45:04", "remaining_time": "1:36:31"}
{"current_steps": 1020, "total_steps": 1352, "loss": 0.0828, "learning_rate": 1.4155189614854275e-05, "epoch": 6.026587887740029, "percentage": 75.44, "elapsed_time": "4:47:52", "remaining_time": "1:33:41"}
{"current_steps": 1030, "total_steps": 1352, "loss": 0.0678, "learning_rate": 1.3354933460078217e-05, "epoch": 6.085672082717873, "percentage": 76.18, "elapsed_time": "4:50:41", "remaining_time": "1:30:52"}
{"current_steps": 1040, "total_steps": 1352, "loss": 0.0629, "learning_rate": 1.257446259144494e-05, "epoch": 6.144756277695716, "percentage": 76.92, "elapsed_time": "4:53:27", "remaining_time": "1:28:02"}
{"current_steps": 1050, "total_steps": 1352, "loss": 0.0697, "learning_rate": 1.1814198398268794e-05, "epoch": 6.203840472673559, "percentage": 77.66, "elapsed_time": "4:56:13", "remaining_time": "1:25:12"}
{"current_steps": 1060, "total_steps": 1352, "loss": 0.0644, "learning_rate": 1.1074551359941021e-05, "epoch": 6.262924667651403, "percentage": 78.4, "elapsed_time": "4:59:01", "remaining_time": "1:22:22"}
{"current_steps": 1070, "total_steps": 1352, "loss": 0.069, "learning_rate": 1.0355920824305127e-05, "epoch": 6.3220088626292466, "percentage": 79.14, "elapsed_time": "5:01:54", "remaining_time": "1:19:34"}
{"current_steps": 1080, "total_steps": 1352, "loss": 0.0666, "learning_rate": 9.658694792042284e-06, "epoch": 6.381093057607091, "percentage": 79.88, "elapsed_time": "5:04:41", "remaining_time": "1:16:44"}
{"current_steps": 1090, "total_steps": 1352, "loss": 0.0679, "learning_rate": 8.98324970718319e-06, "epoch": 6.440177252584934, "percentage": 80.62, "elapsed_time": "5:07:30", "remaining_time": "1:13:54"}
{"current_steps": 1100, "total_steps": 1352, "loss": 0.0656, "learning_rate": 8.329950253859703e-06, "epoch": 6.499261447562777, "percentage": 81.36, "elapsed_time": "5:10:14", "remaining_time": "1:11:04"}
{"current_steps": 1110, "total_steps": 1352, "loss": 0.0664, "learning_rate": 7.699149159405734e-06, "epoch": 6.558345642540621, "percentage": 82.1, "elapsed_time": "5:13:04", "remaining_time": "1:08:15"}
{"current_steps": 1120, "total_steps": 1352, "loss": 0.0673, "learning_rate": 7.0911870039138015e-06, "epoch": 6.617429837518464, "percentage": 82.84, "elapsed_time": "5:15:53", "remaining_time": "1:05:26"}
{"current_steps": 1130, "total_steps": 1352, "loss": 0.0697, "learning_rate": 6.506392036350167e-06, "epoch": 6.676514032496307, "percentage": 83.58, "elapsed_time": "5:18:38", "remaining_time": "1:02:36"}
{"current_steps": 1140, "total_steps": 1352, "loss": 0.0669, "learning_rate": 5.945079997327713e-06, "epoch": 6.735598227474151, "percentage": 84.32, "elapsed_time": "5:21:24", "remaining_time": "0:59:46"}
{"current_steps": 1150, "total_steps": 1352, "loss": 0.0683, "learning_rate": 5.407553948632277e-06, "epoch": 6.794682422451994, "percentage": 85.06, "elapsed_time": "5:24:09", "remaining_time": "0:56:56"}
{"current_steps": 1160, "total_steps": 1352, "loss": 0.0684, "learning_rate": 4.894104109594466e-06, "epoch": 6.853766617429837, "percentage": 85.8, "elapsed_time": "5:26:58", "remaining_time": "0:54:07"}
{"current_steps": 1170, "total_steps": 1352, "loss": 0.0687, "learning_rate": 4.405007700395497e-06, "epoch": 6.912850812407681, "percentage": 86.54, "elapsed_time": "5:29:44", "remaining_time": "0:51:17"}
{"current_steps": 1180, "total_steps": 1352, "loss": 0.0721, "learning_rate": 3.940528792391223e-06, "epoch": 6.971935007385524, "percentage": 87.28, "elapsed_time": "5:32:25", "remaining_time": "0:48:27"}
{"current_steps": 1190, "total_steps": 1352, "loss": 0.0653, "learning_rate": 3.5009181655356826e-06, "epoch": 7.0310192023633675, "percentage": 88.02, "elapsed_time": "5:35:13", "remaining_time": "0:45:38"}
{"current_steps": 1200, "total_steps": 1352, "loss": 0.0579, "learning_rate": 3.0864131729807398e-06, "epoch": 7.0901033973412115, "percentage": 88.76, "elapsed_time": "5:38:03", "remaining_time": "0:42:49"}
{"current_steps": 1210, "total_steps": 1352, "loss": 0.0585, "learning_rate": 2.6972376129251686e-06, "epoch": 7.149187592319055, "percentage": 89.5, "elapsed_time": "5:40:48", "remaining_time": "0:39:59"}
{"current_steps": 1220, "total_steps": 1352, "loss": 0.0562, "learning_rate": 2.3336016077822154e-06, "epoch": 7.208271787296898, "percentage": 90.24, "elapsed_time": "5:43:37", "remaining_time": "0:37:10"}
{"current_steps": 1230, "total_steps": 1352, "loss": 0.0572, "learning_rate": 1.9957014907310224e-06, "epoch": 7.267355982274742, "percentage": 90.98, "elapsed_time": "5:46:23", "remaining_time": "0:34:21"}
{"current_steps": 1240, "total_steps": 1352, "loss": 0.06, "learning_rate": 1.6837196997130434e-06, "epoch": 7.326440177252585, "percentage": 91.72, "elapsed_time": "5:49:09", "remaining_time": "0:31:32"}
{"current_steps": 1250, "total_steps": 1352, "loss": 0.0565, "learning_rate": 1.3978246789307149e-06, "epoch": 7.385524372230428, "percentage": 92.46, "elapsed_time": "5:51:56", "remaining_time": "0:28:43"}
{"current_steps": 1260, "total_steps": 1352, "loss": 0.0562, "learning_rate": 1.1381707879016157e-06, "epoch": 7.444608567208272, "percentage": 93.2, "elapsed_time": "5:54:44", "remaining_time": "0:25:54"}
{"current_steps": 1270, "total_steps": 1352, "loss": 0.0556, "learning_rate": 9.048982181171894e-07, "epoch": 7.503692762186115, "percentage": 93.93, "elapsed_time": "5:57:33", "remaining_time": "0:23:05"}
{"current_steps": 1280, "total_steps": 1352, "loss": 0.0525, "learning_rate": 6.98132917350991e-07, "epoch": 7.562776957163958, "percentage": 94.67, "elapsed_time": "6:00:22", "remaining_time": "0:20:16"}
{"current_steps": 1290, "total_steps": 1352, "loss": 0.0549, "learning_rate": 5.179865216573654e-07, "epoch": 7.621861152141802, "percentage": 95.41, "elapsed_time": "6:03:03", "remaining_time": "0:17:26"}
{"current_steps": 1300, "total_steps": 1352, "loss": 0.0583, "learning_rate": 3.6455629509730136e-07, "epoch": 7.680945347119645, "percentage": 96.15, "elapsed_time": "6:05:55", "remaining_time": "0:14:38"}
{"current_steps": 1310, "total_steps": 1352, "loss": 0.0553, "learning_rate": 2.3792507722388835e-07, "epoch": 7.7400295420974885, "percentage": 96.89, "elapsed_time": "6:08:39", "remaining_time": "0:11:49"}
{"current_steps": 1320, "total_steps": 1352, "loss": 0.0556, "learning_rate": 1.3816123835588834e-07, "epoch": 7.7991137370753325, "percentage": 97.63, "elapsed_time": "6:11:26", "remaining_time": "0:09:00"}
{"current_steps": 1330, "total_steps": 1352, "loss": 0.0589, "learning_rate": 6.531864266343113e-08, "epoch": 7.858197932053176, "percentage": 98.37, "elapsed_time": "6:14:11", "remaining_time": "0:06:11"}
{"current_steps": 1340, "total_steps": 1352, "loss": 0.0603, "learning_rate": 1.943661908586636e-08, "epoch": 7.917282127031019, "percentage": 99.11, "elapsed_time": "6:17:00", "remaining_time": "0:03:22"}
{"current_steps": 1350, "total_steps": 1352, "loss": 0.0568, "learning_rate": 5.399400973882251e-10, "epoch": 7.976366322008863, "percentage": 99.85, "elapsed_time": "6:19:47", "remaining_time": "0:00:33"}
{"current_steps": 1352, "total_steps": 1352, "epoch": 7.988183161004431, "percentage": 100.0, "elapsed_time": "6:20:18", "remaining_time": "0:00:00"}