{ "epoch": 10.0, "eval_loss": 0.09128045290708542, "eval_runtime": 407.0256, "eval_samples_per_second": 89.392, "eval_steps_per_second": 22.35, "num_input_tokens_seen": 250787112, "total_flos": 1.1314919730737775e+19, "train_loss": 0.03974567347884284, "train_runtime": 164298.4475, "train_samples_per_second": 19.931, "train_steps_per_second": 4.983 }