{
  "epoch": 25.0,
  "eval_accuracy": 0.7333895906515843,
  "eval_loss": 2.5845947265625,
  "eval_runtime": 371.8593,
  "eval_samples": 120706,
  "eval_samples_per_second": 324.601,
  "eval_steps_per_second": 3.383,
  "perplexity": 13.257914920283664,
  "total_flos": 7.651144160057088e+18,
  "train_loss": 3.137090846637658,
  "train_runtime": 216876.098,
  "train_samples": 2277342,
  "train_samples_per_second": 262.516,
  "train_steps_per_second": 2.735
}