llama3-3b-coding-gpt4o-100k2 / all_results.json
chansung's picture
End of training
69d5cee verified
raw
history blame contribute delete
413 Bytes
{
"epoch": 9.85925925925926,
"eval_loss": 1.630096197128296,
"eval_runtime": 0.9031,
"eval_samples": 16,
"eval_samples_per_second": 4.429,
"eval_steps_per_second": 1.107,
"total_flos": 2.9601022627828204e+18,
"train_loss": 0.9062140895359552,
"train_runtime": 3484.2972,
"train_samples": 116368,
"train_samples_per_second": 49.516,
"train_steps_per_second": 0.192
}