{ "epoch": 4.0, "total_flos": 3.205097416476426e+17, "train_loss": 0.11358193889833414, "train_runtime": 228.8792, "train_samples_per_second": 18.071, "train_steps_per_second": 2.272 }