marefa-ner / trainer_state.json
bakrianoo's picture
v-1.0.1
2b4990c
raw
history blame
13.3 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 3.704618424302297,
"global_step": 30000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.06,
"learning_rate": 1.9794187865316542e-05,
"loss": 0.7638,
"step": 500
},
{
"epoch": 0.12,
"learning_rate": 1.958837573063308e-05,
"loss": 0.5165,
"step": 1000
},
{
"epoch": 0.19,
"learning_rate": 1.938256359594962e-05,
"loss": 0.457,
"step": 1500
},
{
"epoch": 0.25,
"learning_rate": 1.917675146126616e-05,
"loss": 0.4516,
"step": 2000
},
{
"epoch": 0.31,
"learning_rate": 1.8970939326582696e-05,
"loss": 0.4095,
"step": 2500
},
{
"epoch": 0.37,
"learning_rate": 1.8765127191899236e-05,
"loss": 0.4188,
"step": 3000
},
{
"epoch": 0.43,
"learning_rate": 1.8559315057215776e-05,
"loss": 0.4028,
"step": 3500
},
{
"epoch": 0.49,
"learning_rate": 1.8353502922532313e-05,
"loss": 0.3846,
"step": 4000
},
{
"epoch": 0.56,
"learning_rate": 1.8147690787848853e-05,
"loss": 0.3813,
"step": 4500
},
{
"epoch": 0.62,
"learning_rate": 1.7941878653165393e-05,
"loss": 0.3842,
"step": 5000
},
{
"epoch": 0.68,
"learning_rate": 1.773606651848193e-05,
"loss": 0.3977,
"step": 5500
},
{
"epoch": 0.74,
"learning_rate": 1.753025438379847e-05,
"loss": 0.3749,
"step": 6000
},
{
"epoch": 0.8,
"learning_rate": 1.732444224911501e-05,
"loss": 0.3578,
"step": 6500
},
{
"epoch": 0.86,
"learning_rate": 1.711863011443155e-05,
"loss": 0.339,
"step": 7000
},
{
"epoch": 0.93,
"learning_rate": 1.6912817979748087e-05,
"loss": 0.3704,
"step": 7500
},
{
"epoch": 0.99,
"learning_rate": 1.6707005845064627e-05,
"loss": 0.3423,
"step": 8000
},
{
"epoch": 1.05,
"learning_rate": 1.6501193710381164e-05,
"loss": 0.2788,
"step": 8500
},
{
"epoch": 1.11,
"learning_rate": 1.6295381575697704e-05,
"loss": 0.2832,
"step": 9000
},
{
"epoch": 1.17,
"learning_rate": 1.6089569441014244e-05,
"loss": 0.3032,
"step": 9500
},
{
"epoch": 1.23,
"learning_rate": 1.588375730633078e-05,
"loss": 0.2774,
"step": 10000
},
{
"epoch": 1.23,
"eval_artwork": {
"f1": 0.3447251114413076,
"number": 295,
"precision": 0.30687830687830686,
"recall": 0.39322033898305087
},
"eval_event": {
"f1": 0.43632567849686854,
"number": 519,
"precision": 0.4760820045558087,
"recall": 0.4026974951830443
},
"eval_job": {
"f1": 0.6786657067434606,
"number": 2257,
"precision": 0.7403141361256544,
"recall": 0.6264953478068233
},
"eval_location": {
"f1": 0.6351052692799815,
"number": 4375,
"precision": 0.6466129796305069,
"recall": 0.624
},
"eval_loss": 0.9446586966514587,
"eval_nationality": {
"f1": 0.6808716707021791,
"number": 2137,
"precision": 0.7054691419969895,
"recall": 0.6579316799251287
},
"eval_organization": {
"f1": 0.5520833333333333,
"number": 1982,
"precision": 0.6044417767106842,
"recall": 0.5080726538849647
},
"eval_overall_accuracy": 0.8332146471271692,
"eval_overall_f1": 0.6393731397679646,
"eval_overall_precision": 0.6567667061833157,
"eval_overall_recall": 0.6228770933191313,
"eval_person": {
"f1": 0.7589572006134114,
"number": 3322,
"precision": 0.7068293949623474,
"recall": 0.8193859121011439
},
"eval_product": {
"f1": 0.3201754385964912,
"number": 323,
"precision": 0.5488721804511278,
"recall": 0.2260061919504644
},
"eval_runtime": 43.8587,
"eval_samples_per_second": 35.911,
"eval_time": {
"f1": 0.5435339308578744,
"number": 1689,
"precision": 0.5916376306620209,
"recall": 0.5026642984014209
},
"step": 10000
},
{
"epoch": 1.3,
"learning_rate": 1.567794517164732e-05,
"loss": 0.2914,
"step": 10500
},
{
"epoch": 1.36,
"learning_rate": 1.547213303696386e-05,
"loss": 0.2878,
"step": 11000
},
{
"epoch": 1.42,
"learning_rate": 1.52663209022804e-05,
"loss": 0.2649,
"step": 11500
},
{
"epoch": 1.48,
"learning_rate": 1.506050876759694e-05,
"loss": 0.2794,
"step": 12000
},
{
"epoch": 1.54,
"learning_rate": 1.4854696632913477e-05,
"loss": 0.288,
"step": 12500
},
{
"epoch": 1.61,
"learning_rate": 1.4648884498230017e-05,
"loss": 0.2663,
"step": 13000
},
{
"epoch": 1.67,
"learning_rate": 1.4443072363546555e-05,
"loss": 0.2853,
"step": 13500
},
{
"epoch": 1.73,
"learning_rate": 1.4237260228863094e-05,
"loss": 0.2718,
"step": 14000
},
{
"epoch": 1.79,
"learning_rate": 1.4031448094179634e-05,
"loss": 0.2944,
"step": 14500
},
{
"epoch": 1.85,
"learning_rate": 1.3825635959496172e-05,
"loss": 0.2804,
"step": 15000
},
{
"epoch": 1.91,
"learning_rate": 1.3619823824812712e-05,
"loss": 0.2631,
"step": 15500
},
{
"epoch": 1.98,
"learning_rate": 1.3414011690129251e-05,
"loss": 0.2937,
"step": 16000
},
{
"epoch": 2.04,
"learning_rate": 1.3208199555445791e-05,
"loss": 0.2301,
"step": 16500
},
{
"epoch": 2.1,
"learning_rate": 1.300238742076233e-05,
"loss": 0.2136,
"step": 17000
},
{
"epoch": 2.16,
"learning_rate": 1.2796575286078868e-05,
"loss": 0.2054,
"step": 17500
},
{
"epoch": 2.22,
"learning_rate": 1.2590763151395406e-05,
"loss": 0.2215,
"step": 18000
},
{
"epoch": 2.28,
"learning_rate": 1.2384951016711945e-05,
"loss": 0.2237,
"step": 18500
},
{
"epoch": 2.35,
"learning_rate": 1.2179138882028485e-05,
"loss": 0.2124,
"step": 19000
},
{
"epoch": 2.41,
"learning_rate": 1.1973326747345024e-05,
"loss": 0.2042,
"step": 19500
},
{
"epoch": 2.47,
"learning_rate": 1.1767514612661564e-05,
"loss": 0.2253,
"step": 20000
},
{
"epoch": 2.47,
"eval_artwork": {
"f1": 0.30398069963811825,
"number": 295,
"precision": 0.23595505617977527,
"recall": 0.4271186440677966
},
"eval_event": {
"f1": 0.38726790450928383,
"number": 519,
"precision": 0.35784313725490197,
"recall": 0.42196531791907516
},
"eval_job": {
"f1": 0.6671604938271605,
"number": 2257,
"precision": 0.7534857780256553,
"recall": 0.5985821887461231
},
"eval_location": {
"f1": 0.6328576483075834,
"number": 4375,
"precision": 0.6537524366471735,
"recall": 0.6132571428571428
},
"eval_loss": 1.0017756223678589,
"eval_nationality": {
"f1": 0.6760161635369623,
"number": 2137,
"precision": 0.6869565217391305,
"recall": 0.6654188114178755
},
"eval_organization": {
"f1": 0.5447824850725049,
"number": 1982,
"precision": 0.6241042345276873,
"recall": 0.48335015136226034
},
"eval_overall_accuracy": 0.8219457041840011,
"eval_overall_f1": 0.6276163319784019,
"eval_overall_precision": 0.643866309827597,
"eval_overall_recall": 0.6121664003787206,
"eval_person": {
"f1": 0.7596614950634696,
"number": 3322,
"precision": 0.7147027600849257,
"recall": 0.8106562311860325
},
"eval_product": {
"f1": 0.3699421965317919,
"number": 323,
"precision": 0.4897959183673469,
"recall": 0.29721362229102166
},
"eval_runtime": 44.5273,
"eval_samples_per_second": 35.372,
"eval_time": {
"f1": 0.5069974554707379,
"number": 1689,
"precision": 0.547766323024055,
"recall": 0.4718768502072232
},
"step": 20000
},
{
"epoch": 2.53,
"learning_rate": 1.1561702477978102e-05,
"loss": 0.2197,
"step": 20500
},
{
"epoch": 2.59,
"learning_rate": 1.1355890343294642e-05,
"loss": 0.2239,
"step": 21000
},
{
"epoch": 2.65,
"learning_rate": 1.115007820861118e-05,
"loss": 0.2231,
"step": 21500
},
{
"epoch": 2.72,
"learning_rate": 1.0944266073927721e-05,
"loss": 0.2045,
"step": 22000
},
{
"epoch": 2.78,
"learning_rate": 1.0738453939244258e-05,
"loss": 0.1935,
"step": 22500
},
{
"epoch": 2.84,
"learning_rate": 1.0532641804560796e-05,
"loss": 0.2156,
"step": 23000
},
{
"epoch": 2.9,
"learning_rate": 1.0326829669877336e-05,
"loss": 0.2088,
"step": 23500
},
{
"epoch": 2.96,
"learning_rate": 1.0121017535193875e-05,
"loss": 0.2022,
"step": 24000
},
{
"epoch": 3.03,
"learning_rate": 9.915205400510415e-06,
"loss": 0.1918,
"step": 24500
},
{
"epoch": 3.09,
"learning_rate": 9.709393265826953e-06,
"loss": 0.1494,
"step": 25000
},
{
"epoch": 3.15,
"learning_rate": 9.503581131143494e-06,
"loss": 0.1502,
"step": 25500
},
{
"epoch": 3.21,
"learning_rate": 9.297768996460032e-06,
"loss": 0.1741,
"step": 26000
},
{
"epoch": 3.27,
"learning_rate": 9.09195686177657e-06,
"loss": 0.1609,
"step": 26500
},
{
"epoch": 3.33,
"learning_rate": 8.88614472709311e-06,
"loss": 0.1584,
"step": 27000
},
{
"epoch": 3.4,
"learning_rate": 8.680332592409649e-06,
"loss": 0.1524,
"step": 27500
},
{
"epoch": 3.46,
"learning_rate": 8.47452045772619e-06,
"loss": 0.1513,
"step": 28000
},
{
"epoch": 3.52,
"learning_rate": 8.268708323042726e-06,
"loss": 0.1595,
"step": 28500
},
{
"epoch": 3.58,
"learning_rate": 8.062896188359266e-06,
"loss": 0.1631,
"step": 29000
},
{
"epoch": 3.64,
"learning_rate": 7.857084053675805e-06,
"loss": 0.1795,
"step": 29500
},
{
"epoch": 3.7,
"learning_rate": 7.651271918992345e-06,
"loss": 0.1602,
"step": 30000
},
{
"epoch": 3.7,
"eval_artwork": {
"f1": 0.32594936708860756,
"number": 295,
"precision": 0.3056379821958457,
"recall": 0.34915254237288135
},
"eval_event": {
"f1": 0.42843232716650437,
"number": 519,
"precision": 0.4330708661417323,
"recall": 0.4238921001926782
},
"eval_job": {
"f1": 0.6932195353247985,
"number": 2257,
"precision": 0.7455379908210097,
"recall": 0.6477625166149756
},
"eval_location": {
"f1": 0.6270144927536232,
"number": 4375,
"precision": 0.636235294117647,
"recall": 0.6180571428571429
},
"eval_loss": 1.0499603748321533,
"eval_nationality": {
"f1": 0.6754837129561596,
"number": 2137,
"precision": 0.7086330935251799,
"recall": 0.6452971455311184
},
"eval_organization": {
"f1": 0.5687919463087249,
"number": 1982,
"precision": 0.6380175658720201,
"recall": 0.5131180625630676
},
"eval_overall_accuracy": 0.8283547593168672,
"eval_overall_f1": 0.6409662071489569,
"eval_overall_precision": 0.6613380326011706,
"eval_overall_recall": 0.6218119415350021,
"eval_person": {
"f1": 0.7734217353704237,
"number": 3322,
"precision": 0.7419800884955752,
"recall": 0.8076459963877183
},
"eval_product": {
"f1": 0.4022556390977444,
"number": 323,
"precision": 0.5119617224880383,
"recall": 0.33126934984520123
},
"eval_runtime": 43.8719,
"eval_samples_per_second": 35.9,
"eval_time": {
"f1": 0.5277161862527716,
"number": 1689,
"precision": 0.5674386920980926,
"recall": 0.4931912374185909
},
"step": 30000
}
],
"max_steps": 48588,
"num_train_epochs": 6,
"total_flos": 3961931727576942.0,
"trial_name": null,
"trial_params": null
}