{ "epoch": 1.9961464354527938, "eval_loss": 0.27941030263900757, "eval_runtime": 142.8124, "eval_samples": 1998, "eval_samples_per_second": 13.99, "eval_steps_per_second": 0.441, "total_flos": 2.6836433607911014e+17, "train_loss": 0.7686227933723033, "train_runtime": 16387.3806, "train_samples": 33211, "train_samples_per_second": 4.053, "train_steps_per_second": 0.032 }