{
"epoch": 19.992235020059532,
"eval_accuracy": 0.42861324947683616,
"eval_loss": 2.9304451942443848,
"eval_runtime": 110.0361,
"eval_samples": 52190,
"eval_samples_per_second": 474.299,
"eval_steps_per_second": 7.416,
"perplexity": 18.735969786145102,
"total_flos": 1.291633274290176e+18,
"train_loss": 3.0124951987362847,
"train_runtime": 40662.5012,
"train_samples": 494517,
"train_samples_per_second": 243.23,
"train_steps_per_second": 0.95
}