{ | |
"epoch": 25.0, | |
"eval_accuracy": 0.7595563359244226, | |
"eval_loss": 3.4102275371551514, | |
"eval_runtime": 386.7326, | |
"eval_samples": 120706, | |
"eval_samples_per_second": 312.118, | |
"eval_steps_per_second": 3.253, | |
"perplexity": 30.272131510501872, | |
"total_flos": 1.5091168791146803e+19, | |
"train_loss": 4.081508317309086, | |
"train_runtime": 296836.3665, | |
"train_samples": 2277342, | |
"train_samples_per_second": 191.801, | |
"train_steps_per_second": 1.998 | |
} |