{
"epoch": 20.0,
"eval_accuracy": 0.4234014597448438,
"eval_loss": 3.0190186500549316,
"eval_runtime": 111.5107,
"eval_samples": 52440,
"eval_samples_per_second": 470.269,
"eval_steps_per_second": 7.354,
"perplexity": 20.47119242004321,
"total_flos": 1.29957250203648e+18,
"train_loss": 2.7038125842232534,
"train_runtime": 44110.0674,
"train_samples": 497364,
"train_samples_per_second": 225.51,
"train_steps_per_second": 7.047
}