{ "epoch": 20.0, "eval_accuracy": 0.4234014597448438, "eval_loss": 3.0190186500549316, "eval_runtime": 111.5306, "eval_samples": 52440, "eval_samples_per_second": 470.185, "eval_steps_per_second": 7.352, "perplexity": 20.47119242004321, "total_flos": 1.29957250203648e+18, "train_loss": 2.7038125842232534, "train_runtime": 43992.4165, "train_samples": 497364, "train_samples_per_second": 226.114, "train_steps_per_second": 7.066 }