{
  "epoch": 0.9999557541701695,
  "eval_accuracy": 0.5529722548590473,
  "eval_loss": 2.0769529342651367,
  "eval_runtime": 11.3861,
  "eval_samples": 318,
  "eval_samples_per_second": 27.929,
  "eval_steps_per_second": 0.439,
  "perplexity": 7.980115892812829,
  "total_flos": 1.1360877451905964e+21,
  "train_loss": 2.231945479570237,
  "train_runtime": 110078.6466,
  "train_samples": 1446409,
  "train_samples_per_second": 13.14,
  "train_steps_per_second": 0.103
}