{ "epoch": 0.9999557541701695, "eval_accuracy": 0.5529722548590473, "eval_loss": 2.0769529342651367, "eval_runtime": 11.3861, "eval_samples": 318, "eval_samples_per_second": 27.929, "eval_steps_per_second": 0.439, "perplexity": 7.980115892812829, "total_flos": 1.1360877451905964e+21, "train_loss": 2.231945479570237, "train_runtime": 110078.6466, "train_samples": 1446409, "train_samples_per_second": 13.14, "train_steps_per_second": 0.103 }