{ "epoch": 25.0, "eval_accuracy": 0.7595563359244226, "eval_loss": 3.4102275371551514, "eval_runtime": 386.7326, "eval_samples": 120706, "eval_samples_per_second": 312.118, "eval_steps_per_second": 3.253, "perplexity": 30.272131510501872, "total_flos": 1.5091168791146803e+19, "train_loss": 4.081508317309086, "train_runtime": 296836.3665, "train_samples": 2277342, "train_samples_per_second": 191.801, "train_steps_per_second": 1.998 }