{ "epoch": 3.0, "total_flos": 1.8124066505760768e+18, "train_loss": 0.1439182724869042, "train_runtime": 556.909, "train_samples_per_second": 130.901, "train_steps_per_second": 1.024 }