{ "epoch": 0.0067933301849093615, "eval_accuracy": 0.09167533902983765, "eval_loss": 8.9140625, "eval_runtime": 492.4035, "eval_samples": 33767, "eval_samples_per_second": 68.576, "eval_steps_per_second": 2.857, "perplexity": 7435.807790500043, "total_flos": 1043124562427904.0, "train_loss": 9.606408756684491, "train_runtime": 94484.0244, "train_samples": 660643, "train_samples_per_second": 699.211, "train_steps_per_second": 29.134 }