|
{ |
|
"best_metric": 0.3751698136329651, |
|
"best_model_checkpoint": "faces_age_detection/checkpoint-4060", |
|
"epoch": 10.0, |
|
"eval_steps": 500, |
|
"global_step": 4060, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7212710165047046, |
|
"eval_loss": 0.7058069109916687, |
|
"eval_runtime": 62.5355, |
|
"eval_samples_per_second": 103.669, |
|
"eval_steps_per_second": 3.246, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 1.23, |
|
"learning_rate": 8.87780548628429e-06, |
|
"loss": 0.6936, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7899120777417862, |
|
"eval_loss": 0.5647568702697754, |
|
"eval_runtime": 55.8142, |
|
"eval_samples_per_second": 116.153, |
|
"eval_steps_per_second": 3.637, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 2.46, |
|
"learning_rate": 7.630922693266833e-06, |
|
"loss": 0.4109, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.8095017738701219, |
|
"eval_loss": 0.504371702671051, |
|
"eval_runtime": 67.4983, |
|
"eval_samples_per_second": 96.047, |
|
"eval_steps_per_second": 3.007, |
|
"step": 1218 |
|
}, |
|
{ |
|
"epoch": 3.69, |
|
"learning_rate": 6.384039900249377e-06, |
|
"loss": 0.3018, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8256979793305569, |
|
"eval_loss": 0.45867738127708435, |
|
"eval_runtime": 59.0046, |
|
"eval_samples_per_second": 109.873, |
|
"eval_steps_per_second": 3.44, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 4.93, |
|
"learning_rate": 5.13715710723192e-06, |
|
"loss": 0.2342, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8258522289063706, |
|
"eval_loss": 0.4397270679473877, |
|
"eval_runtime": 58.6333, |
|
"eval_samples_per_second": 110.569, |
|
"eval_steps_per_second": 3.462, |
|
"step": 2030 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8364954496375135, |
|
"eval_loss": 0.4140736162662506, |
|
"eval_runtime": 59.1185, |
|
"eval_samples_per_second": 109.661, |
|
"eval_steps_per_second": 3.434, |
|
"step": 2436 |
|
}, |
|
{ |
|
"epoch": 6.16, |
|
"learning_rate": 3.890274314214464e-06, |
|
"loss": 0.1955, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8480641678235384, |
|
"eval_loss": 0.38966086506843567, |
|
"eval_runtime": 61.8272, |
|
"eval_samples_per_second": 104.857, |
|
"eval_steps_per_second": 3.283, |
|
"step": 2842 |
|
}, |
|
{ |
|
"epoch": 7.39, |
|
"learning_rate": 2.643391521197008e-06, |
|
"loss": 0.155, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8537714021286441, |
|
"eval_loss": 0.381708025932312, |
|
"eval_runtime": 58.9967, |
|
"eval_samples_per_second": 109.887, |
|
"eval_steps_per_second": 3.441, |
|
"step": 3248 |
|
}, |
|
{ |
|
"epoch": 8.62, |
|
"learning_rate": 1.396508728179551e-06, |
|
"loss": 0.1312, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8576276415239859, |
|
"eval_loss": 0.3779039680957794, |
|
"eval_runtime": 56.914, |
|
"eval_samples_per_second": 113.909, |
|
"eval_steps_per_second": 3.567, |
|
"step": 3654 |
|
}, |
|
{ |
|
"epoch": 9.85, |
|
"learning_rate": 1.4962593516209478e-07, |
|
"loss": 0.1166, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8557766466142218, |
|
"eval_loss": 0.3751698136329651, |
|
"eval_runtime": 56.9282, |
|
"eval_samples_per_second": 113.88, |
|
"eval_steps_per_second": 3.566, |
|
"step": 4060 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4060, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"total_flos": 2.0093078073456787e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|