{
  "epoch": 25.0,
  "eval_accuracy": 0.731461833901348,
  "eval_loss": 3.1051392555236816,
  "eval_runtime": 146.3683,
  "eval_samples": 120706,
  "eval_samples_per_second": 824.673,
  "eval_steps_per_second": 8.595,
  "perplexity": 22.31232587356851,
  "total_flos": 7.65181665004032e+18,
  "train_loss": 3.640720207871391,
  "train_runtime": 132653.8084,
  "train_samples": 2277342,
  "train_samples_per_second": 429.189,
  "train_steps_per_second": 4.471
}