train_qqp_1753094138 / train_results.json
rbelanec's picture
End of training
67da558 verified
{
"epoch": 10.0,
"num_input_tokens_seen": 250787112,
"total_flos": 1.129312614612566e+19,
"train_loss": 0.10160401221093869,
"train_runtime": 128514.3675,
"train_samples_per_second": 25.48,
"train_steps_per_second": 6.37
}