{ "best_metric": null, "best_model_checkpoint": null, "epoch": 3.704618424302297, "global_step": 30000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "learning_rate": 1.9794187865316542e-05, "loss": 0.7638, "step": 500 }, { "epoch": 0.12, "learning_rate": 1.958837573063308e-05, "loss": 0.5165, "step": 1000 }, { "epoch": 0.19, "learning_rate": 1.938256359594962e-05, "loss": 0.457, "step": 1500 }, { "epoch": 0.25, "learning_rate": 1.917675146126616e-05, "loss": 0.4516, "step": 2000 }, { "epoch": 0.31, "learning_rate": 1.8970939326582696e-05, "loss": 0.4095, "step": 2500 }, { "epoch": 0.37, "learning_rate": 1.8765127191899236e-05, "loss": 0.4188, "step": 3000 }, { "epoch": 0.43, "learning_rate": 1.8559315057215776e-05, "loss": 0.4028, "step": 3500 }, { "epoch": 0.49, "learning_rate": 1.8353502922532313e-05, "loss": 0.3846, "step": 4000 }, { "epoch": 0.56, "learning_rate": 1.8147690787848853e-05, "loss": 0.3813, "step": 4500 }, { "epoch": 0.62, "learning_rate": 1.7941878653165393e-05, "loss": 0.3842, "step": 5000 }, { "epoch": 0.68, "learning_rate": 1.773606651848193e-05, "loss": 0.3977, "step": 5500 }, { "epoch": 0.74, "learning_rate": 1.753025438379847e-05, "loss": 0.3749, "step": 6000 }, { "epoch": 0.8, "learning_rate": 1.732444224911501e-05, "loss": 0.3578, "step": 6500 }, { "epoch": 0.86, "learning_rate": 1.711863011443155e-05, "loss": 0.339, "step": 7000 }, { "epoch": 0.93, "learning_rate": 1.6912817979748087e-05, "loss": 0.3704, "step": 7500 }, { "epoch": 0.99, "learning_rate": 1.6707005845064627e-05, "loss": 0.3423, "step": 8000 }, { "epoch": 1.05, "learning_rate": 1.6501193710381164e-05, "loss": 0.2788, "step": 8500 }, { "epoch": 1.11, "learning_rate": 1.6295381575697704e-05, "loss": 0.2832, "step": 9000 }, { "epoch": 1.17, "learning_rate": 1.6089569441014244e-05, "loss": 0.3032, "step": 9500 }, { "epoch": 1.23, "learning_rate": 1.588375730633078e-05, "loss": 0.2774, "step": 10000 }, { "epoch": 1.23, "eval_artwork": { "f1": 0.3447251114413076, "number": 295, "precision": 0.30687830687830686, "recall": 0.39322033898305087 }, "eval_event": { "f1": 0.43632567849686854, "number": 519, "precision": 0.4760820045558087, "recall": 0.4026974951830443 }, "eval_job": { "f1": 0.6786657067434606, "number": 2257, "precision": 0.7403141361256544, "recall": 0.6264953478068233 }, "eval_location": { "f1": 0.6351052692799815, "number": 4375, "precision": 0.6466129796305069, "recall": 0.624 }, "eval_loss": 0.9446586966514587, "eval_nationality": { "f1": 0.6808716707021791, "number": 2137, "precision": 0.7054691419969895, "recall": 0.6579316799251287 }, "eval_organization": { "f1": 0.5520833333333333, "number": 1982, "precision": 0.6044417767106842, "recall": 0.5080726538849647 }, "eval_overall_accuracy": 0.8332146471271692, "eval_overall_f1": 0.6393731397679646, "eval_overall_precision": 0.6567667061833157, "eval_overall_recall": 0.6228770933191313, "eval_person": { "f1": 0.7589572006134114, "number": 3322, "precision": 0.7068293949623474, "recall": 0.8193859121011439 }, "eval_product": { "f1": 0.3201754385964912, "number": 323, "precision": 0.5488721804511278, "recall": 0.2260061919504644 }, "eval_runtime": 43.8587, "eval_samples_per_second": 35.911, "eval_time": { "f1": 0.5435339308578744, "number": 1689, "precision": 0.5916376306620209, "recall": 0.5026642984014209 }, "step": 10000 }, { "epoch": 1.3, "learning_rate": 1.567794517164732e-05, "loss": 0.2914, "step": 10500 }, { "epoch": 1.36, "learning_rate": 1.547213303696386e-05, "loss": 0.2878, "step": 11000 }, { "epoch": 1.42, "learning_rate": 1.52663209022804e-05, "loss": 0.2649, "step": 11500 }, { "epoch": 1.48, "learning_rate": 1.506050876759694e-05, "loss": 0.2794, "step": 12000 }, { "epoch": 1.54, "learning_rate": 1.4854696632913477e-05, "loss": 0.288, "step": 12500 }, { "epoch": 1.61, "learning_rate": 1.4648884498230017e-05, "loss": 0.2663, "step": 13000 }, { "epoch": 1.67, "learning_rate": 1.4443072363546555e-05, "loss": 0.2853, "step": 13500 }, { "epoch": 1.73, "learning_rate": 1.4237260228863094e-05, "loss": 0.2718, "step": 14000 }, { "epoch": 1.79, "learning_rate": 1.4031448094179634e-05, "loss": 0.2944, "step": 14500 }, { "epoch": 1.85, "learning_rate": 1.3825635959496172e-05, "loss": 0.2804, "step": 15000 }, { "epoch": 1.91, "learning_rate": 1.3619823824812712e-05, "loss": 0.2631, "step": 15500 }, { "epoch": 1.98, "learning_rate": 1.3414011690129251e-05, "loss": 0.2937, "step": 16000 }, { "epoch": 2.04, "learning_rate": 1.3208199555445791e-05, "loss": 0.2301, "step": 16500 }, { "epoch": 2.1, "learning_rate": 1.300238742076233e-05, "loss": 0.2136, "step": 17000 }, { "epoch": 2.16, "learning_rate": 1.2796575286078868e-05, "loss": 0.2054, "step": 17500 }, { "epoch": 2.22, "learning_rate": 1.2590763151395406e-05, "loss": 0.2215, "step": 18000 }, { "epoch": 2.28, "learning_rate": 1.2384951016711945e-05, "loss": 0.2237, "step": 18500 }, { "epoch": 2.35, "learning_rate": 1.2179138882028485e-05, "loss": 0.2124, "step": 19000 }, { "epoch": 2.41, "learning_rate": 1.1973326747345024e-05, "loss": 0.2042, "step": 19500 }, { "epoch": 2.47, "learning_rate": 1.1767514612661564e-05, "loss": 0.2253, "step": 20000 }, { "epoch": 2.47, "eval_artwork": { "f1": 0.30398069963811825, "number": 295, "precision": 0.23595505617977527, "recall": 0.4271186440677966 }, "eval_event": { "f1": 0.38726790450928383, "number": 519, "precision": 0.35784313725490197, "recall": 0.42196531791907516 }, "eval_job": { "f1": 0.6671604938271605, "number": 2257, "precision": 0.7534857780256553, "recall": 0.5985821887461231 }, "eval_location": { "f1": 0.6328576483075834, "number": 4375, "precision": 0.6537524366471735, "recall": 0.6132571428571428 }, "eval_loss": 1.0017756223678589, "eval_nationality": { "f1": 0.6760161635369623, "number": 2137, "precision": 0.6869565217391305, "recall": 0.6654188114178755 }, "eval_organization": { "f1": 0.5447824850725049, "number": 1982, "precision": 0.6241042345276873, "recall": 0.48335015136226034 }, "eval_overall_accuracy": 0.8219457041840011, "eval_overall_f1": 0.6276163319784019, "eval_overall_precision": 0.643866309827597, "eval_overall_recall": 0.6121664003787206, "eval_person": { "f1": 0.7596614950634696, "number": 3322, "precision": 0.7147027600849257, "recall": 0.8106562311860325 }, "eval_product": { "f1": 0.3699421965317919, "number": 323, "precision": 0.4897959183673469, "recall": 0.29721362229102166 }, "eval_runtime": 44.5273, "eval_samples_per_second": 35.372, "eval_time": { "f1": 0.5069974554707379, "number": 1689, "precision": 0.547766323024055, "recall": 0.4718768502072232 }, "step": 20000 }, { "epoch": 2.53, "learning_rate": 1.1561702477978102e-05, "loss": 0.2197, "step": 20500 }, { "epoch": 2.59, "learning_rate": 1.1355890343294642e-05, "loss": 0.2239, "step": 21000 }, { "epoch": 2.65, "learning_rate": 1.115007820861118e-05, "loss": 0.2231, "step": 21500 }, { "epoch": 2.72, "learning_rate": 1.0944266073927721e-05, "loss": 0.2045, "step": 22000 }, { "epoch": 2.78, "learning_rate": 1.0738453939244258e-05, "loss": 0.1935, "step": 22500 }, { "epoch": 2.84, "learning_rate": 1.0532641804560796e-05, "loss": 0.2156, "step": 23000 }, { "epoch": 2.9, "learning_rate": 1.0326829669877336e-05, "loss": 0.2088, "step": 23500 }, { "epoch": 2.96, "learning_rate": 1.0121017535193875e-05, "loss": 0.2022, "step": 24000 }, { "epoch": 3.03, "learning_rate": 9.915205400510415e-06, "loss": 0.1918, "step": 24500 }, { "epoch": 3.09, "learning_rate": 9.709393265826953e-06, "loss": 0.1494, "step": 25000 }, { "epoch": 3.15, "learning_rate": 9.503581131143494e-06, "loss": 0.1502, "step": 25500 }, { "epoch": 3.21, "learning_rate": 9.297768996460032e-06, "loss": 0.1741, "step": 26000 }, { "epoch": 3.27, "learning_rate": 9.09195686177657e-06, "loss": 0.1609, "step": 26500 }, { "epoch": 3.33, "learning_rate": 8.88614472709311e-06, "loss": 0.1584, "step": 27000 }, { "epoch": 3.4, "learning_rate": 8.680332592409649e-06, "loss": 0.1524, "step": 27500 }, { "epoch": 3.46, "learning_rate": 8.47452045772619e-06, "loss": 0.1513, "step": 28000 }, { "epoch": 3.52, "learning_rate": 8.268708323042726e-06, "loss": 0.1595, "step": 28500 }, { "epoch": 3.58, "learning_rate": 8.062896188359266e-06, "loss": 0.1631, "step": 29000 }, { "epoch": 3.64, "learning_rate": 7.857084053675805e-06, "loss": 0.1795, "step": 29500 }, { "epoch": 3.7, "learning_rate": 7.651271918992345e-06, "loss": 0.1602, "step": 30000 }, { "epoch": 3.7, "eval_artwork": { "f1": 0.32594936708860756, "number": 295, "precision": 0.3056379821958457, "recall": 0.34915254237288135 }, "eval_event": { "f1": 0.42843232716650437, "number": 519, "precision": 0.4330708661417323, "recall": 0.4238921001926782 }, "eval_job": { "f1": 0.6932195353247985, "number": 2257, "precision": 0.7455379908210097, "recall": 0.6477625166149756 }, "eval_location": { "f1": 0.6270144927536232, "number": 4375, "precision": 0.636235294117647, "recall": 0.6180571428571429 }, "eval_loss": 1.0499603748321533, "eval_nationality": { "f1": 0.6754837129561596, "number": 2137, "precision": 0.7086330935251799, "recall": 0.6452971455311184 }, "eval_organization": { "f1": 0.5687919463087249, "number": 1982, "precision": 0.6380175658720201, "recall": 0.5131180625630676 }, "eval_overall_accuracy": 0.8283547593168672, "eval_overall_f1": 0.6409662071489569, "eval_overall_precision": 0.6613380326011706, "eval_overall_recall": 0.6218119415350021, "eval_person": { "f1": 0.7734217353704237, "number": 3322, "precision": 0.7419800884955752, "recall": 0.8076459963877183 }, "eval_product": { "f1": 0.4022556390977444, "number": 323, "precision": 0.5119617224880383, "recall": 0.33126934984520123 }, "eval_runtime": 43.8719, "eval_samples_per_second": 35.9, "eval_time": { "f1": 0.5277161862527716, "number": 1689, "precision": 0.5674386920980926, "recall": 0.4931912374185909 }, "step": 30000 } ], "max_steps": 48588, "num_train_epochs": 6, "total_flos": 3961931727576942.0, "trial_name": null, "trial_params": null }