{
  "epoch": 25.0,
  "eval_accuracy": 0.7530519758192171,
  "eval_loss": 1.0775210857391357,
  "eval_runtime": 182.4452,
  "eval_samples": 120706,
  "eval_samples_per_second": 661.601,
  "eval_steps_per_second": 6.895,
  "perplexity": 2.937388983012658,
  "total_flos": 1.498518436978944e+19,
  "train_loss": 2.334269580478457,
  "train_runtime": 190366.3414,
  "train_samples": 2277342,
  "train_samples_per_second": 299.074,
  "train_steps_per_second": 3.115
}