|
{ |
|
"best_metric": 0.6566383257030739, |
|
"best_model_checkpoint": "twitter-roberta-base-CoNLL/checkpoint-500", |
|
"epoch": 10.0, |
|
"global_step": 540, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.46, |
|
"eval_accuracy": 0.9230280302548782, |
|
"eval_f1": 0.03744493392070484, |
|
"eval_loss": 0.28825512528419495, |
|
"eval_precision": 0.2361111111111111, |
|
"eval_recall": 0.02033492822966507, |
|
"eval_runtime": 1.8273, |
|
"eval_samples_per_second": 552.196, |
|
"eval_steps_per_second": 0.547, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_accuracy": 0.9474988876882985, |
|
"eval_f1": 0.5355029585798816, |
|
"eval_loss": 0.20930655300617218, |
|
"eval_precision": 0.7015503875968992, |
|
"eval_recall": 0.43301435406698563, |
|
"eval_runtime": 1.5316, |
|
"eval_samples_per_second": 658.776, |
|
"eval_steps_per_second": 0.653, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_accuracy": 0.9579228373482489, |
|
"eval_f1": 0.6288323548597522, |
|
"eval_loss": 0.1807074397802353, |
|
"eval_precision": 0.6915351506456241, |
|
"eval_recall": 0.5765550239234449, |
|
"eval_runtime": 1.5064, |
|
"eval_samples_per_second": 669.792, |
|
"eval_steps_per_second": 0.664, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_accuracy": 0.9608466281065277, |
|
"eval_f1": 0.6203411244472521, |
|
"eval_loss": 0.1702219694852829, |
|
"eval_precision": 0.6572958500669344, |
|
"eval_recall": 0.5873205741626795, |
|
"eval_runtime": 1.5233, |
|
"eval_samples_per_second": 662.362, |
|
"eval_steps_per_second": 0.656, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"eval_accuracy": 0.9616093561304265, |
|
"eval_f1": 0.6293800539083557, |
|
"eval_loss": 0.1766974776983261, |
|
"eval_precision": 0.720679012345679, |
|
"eval_recall": 0.5586124401913876, |
|
"eval_runtime": 1.5236, |
|
"eval_samples_per_second": 662.237, |
|
"eval_steps_per_second": 0.656, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 2.78, |
|
"eval_accuracy": 0.9617364774677429, |
|
"eval_f1": 0.6370860927152318, |
|
"eval_loss": 0.17372390627861023, |
|
"eval_precision": 0.7136498516320475, |
|
"eval_recall": 0.5753588516746412, |
|
"eval_runtime": 1.5265, |
|
"eval_samples_per_second": 660.978, |
|
"eval_steps_per_second": 0.655, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 3.24, |
|
"eval_accuracy": 0.9635161761901735, |
|
"eval_f1": 0.6610279765777489, |
|
"eval_loss": 0.1732863336801529, |
|
"eval_precision": 0.724679029957204, |
|
"eval_recall": 0.6076555023923444, |
|
"eval_runtime": 1.6272, |
|
"eval_samples_per_second": 620.089, |
|
"eval_steps_per_second": 0.615, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 3.7, |
|
"eval_accuracy": 0.9644695862200471, |
|
"eval_f1": 0.6645728643216081, |
|
"eval_loss": 0.16830594837665558, |
|
"eval_precision": 0.6997354497354498, |
|
"eval_recall": 0.6327751196172249, |
|
"eval_runtime": 1.5645, |
|
"eval_samples_per_second": 644.943, |
|
"eval_steps_per_second": 0.639, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.17, |
|
"eval_accuracy": 0.9647873895633382, |
|
"eval_f1": 0.6692160611854684, |
|
"eval_loss": 0.1790447235107422, |
|
"eval_precision": 0.7162346521145976, |
|
"eval_recall": 0.6279904306220095, |
|
"eval_runtime": 1.5303, |
|
"eval_samples_per_second": 659.327, |
|
"eval_steps_per_second": 0.653, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 4.63, |
|
"eval_accuracy": 0.9645331468887053, |
|
"eval_f1": 0.6596858638743455, |
|
"eval_loss": 0.1847098022699356, |
|
"eval_precision": 0.7283236994219653, |
|
"eval_recall": 0.6028708133971292, |
|
"eval_runtime": 1.5507, |
|
"eval_samples_per_second": 650.675, |
|
"eval_steps_per_second": 0.645, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 5.09, |
|
"eval_accuracy": 0.9638339795334647, |
|
"eval_f1": 0.6632057105775471, |
|
"eval_loss": 0.1948511302471161, |
|
"eval_precision": 0.724822695035461, |
|
"eval_recall": 0.611244019138756, |
|
"eval_runtime": 1.7607, |
|
"eval_samples_per_second": 573.054, |
|
"eval_steps_per_second": 0.568, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 5.56, |
|
"eval_accuracy": 0.9647873895633382, |
|
"eval_f1": 0.6649649010848755, |
|
"eval_loss": 0.18528707325458527, |
|
"eval_precision": 0.7127222982216143, |
|
"eval_recall": 0.6232057416267942, |
|
"eval_runtime": 1.5232, |
|
"eval_samples_per_second": 662.408, |
|
"eval_steps_per_second": 0.656, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.02, |
|
"eval_accuracy": 0.9644695862200471, |
|
"eval_f1": 0.669172932330827, |
|
"eval_loss": 0.18068380653858185, |
|
"eval_precision": 0.7026315789473684, |
|
"eval_recall": 0.638755980861244, |
|
"eval_runtime": 1.5586, |
|
"eval_samples_per_second": 647.372, |
|
"eval_steps_per_second": 0.642, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 6.48, |
|
"eval_accuracy": 0.9641517828767558, |
|
"eval_f1": 0.664951768488746, |
|
"eval_loss": 0.20004822313785553, |
|
"eval_precision": 0.7190542420027817, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 1.5707, |
|
"eval_samples_per_second": 642.403, |
|
"eval_steps_per_second": 0.637, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 6.94, |
|
"eval_accuracy": 0.9638339795334647, |
|
"eval_f1": 0.6614987080103358, |
|
"eval_loss": 0.19970329105854034, |
|
"eval_precision": 0.7191011235955056, |
|
"eval_recall": 0.6124401913875598, |
|
"eval_runtime": 1.5546, |
|
"eval_samples_per_second": 649.03, |
|
"eval_steps_per_second": 0.643, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 7.41, |
|
"eval_accuracy": 0.9640246615394394, |
|
"eval_f1": 0.663659793814433, |
|
"eval_loss": 0.2035072147846222, |
|
"eval_precision": 0.7192737430167597, |
|
"eval_recall": 0.6160287081339713, |
|
"eval_runtime": 1.5893, |
|
"eval_samples_per_second": 634.88, |
|
"eval_steps_per_second": 0.629, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.87, |
|
"eval_accuracy": 0.9643424648827306, |
|
"eval_f1": 0.6557169930511686, |
|
"eval_loss": 0.19765512645244598, |
|
"eval_precision": 0.6947791164658634, |
|
"eval_recall": 0.6208133971291866, |
|
"eval_runtime": 1.57, |
|
"eval_samples_per_second": 642.691, |
|
"eval_steps_per_second": 0.637, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"eval_accuracy": 0.9645331468887053, |
|
"eval_f1": 0.6683706070287541, |
|
"eval_loss": 0.20478704571723938, |
|
"eval_precision": 0.7174211248285323, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 1.58, |
|
"eval_samples_per_second": 638.623, |
|
"eval_steps_per_second": 0.633, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.964215343545414, |
|
"eval_f1": 0.6610608020698577, |
|
"eval_loss": 0.2073480784893036, |
|
"eval_precision": 0.719718309859155, |
|
"eval_recall": 0.611244019138756, |
|
"eval_runtime": 1.6091, |
|
"eval_samples_per_second": 627.07, |
|
"eval_steps_per_second": 0.621, |
|
"step": 475 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"learning_rate": 3.7037037037037037e-06, |
|
"loss": 0.07, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"eval_accuracy": 0.9638339795334647, |
|
"eval_f1": 0.6566383257030739, |
|
"eval_loss": 0.21393825113773346, |
|
"eval_precision": 0.7243867243867244, |
|
"eval_recall": 0.6004784688995215, |
|
"eval_runtime": 1.5553, |
|
"eval_samples_per_second": 648.763, |
|
"eval_steps_per_second": 0.643, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.72, |
|
"eval_accuracy": 0.96472382889468, |
|
"eval_f1": 0.663284717818643, |
|
"eval_loss": 0.20485757291316986, |
|
"eval_precision": 0.7058029689608637, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 1.544, |
|
"eval_samples_per_second": 653.493, |
|
"eval_steps_per_second": 0.648, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 540, |
|
"total_flos": 1009327449452316.0, |
|
"train_loss": 0.06530485324285648, |
|
"train_runtime": 166.7998, |
|
"train_samples_per_second": 203.477, |
|
"train_steps_per_second": 3.237 |
|
} |
|
], |
|
"max_steps": 540, |
|
"num_train_epochs": 10, |
|
"total_flos": 1009327449452316.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|