{ | |
"epoch": 25.0, | |
"eval_accuracy": 0.7551218228545009, | |
"eval_loss": 4.475677013397217, | |
"eval_runtime": 256.477, | |
"eval_samples": 120706, | |
"eval_samples_per_second": 470.631, | |
"eval_steps_per_second": 4.905, | |
"perplexity": 87.85405865517882, | |
"total_flos": 1.5101928630878515e+19, | |
"train_loss": 5.231086326933267, | |
"train_runtime": 273328.675, | |
"train_samples": 2277342, | |
"train_samples_per_second": 208.297, | |
"train_steps_per_second": 2.17 | |
} |