{ | |
"epoch": 20.0, | |
"eval_accuracy": 0.41021489963935376, | |
"eval_loss": 3.423628807067871, | |
"eval_runtime": 154.4177, | |
"eval_samples": 57917, | |
"eval_samples_per_second": 375.067, | |
"eval_steps_per_second": 5.861, | |
"perplexity": 30.68054704672833, | |
"total_flos": 1.5670047538944e+18, | |
"train_loss": 3.0279207580395733, | |
"train_runtime": 82395.3872, | |
"train_samples": 595065, | |
"train_samples_per_second": 144.441, | |
"train_steps_per_second": 4.514 | |
} |