{
  "epoch": 25.0,
  "eval_accuracy": 0.6857676426031905,
  "eval_loss": 2.85996150970459,
  "eval_runtime": 181.6889,
  "eval_samples": 120706,
  "eval_samples_per_second": 664.356,
  "eval_steps_per_second": 4.155,
  "perplexity": 17.460854850184376,
  "total_flos": 3.037727852389325e+18,
  "train_loss": 3.5510173419085684,
  "train_runtime": 125655.4376,
  "train_samples": 2277342,
  "train_samples_per_second": 453.093,
  "train_steps_per_second": 2.832
}