{ "epoch": 100.0, "total_flos": 4.804632427843584e+17, "train_loss": 0.07632537007331848, "train_runtime": 425.2676, "train_samples_per_second": 14.579, "train_steps_per_second": 0.235 }