qwen3-06.B-sft / all_results.json
vanek-epfl's picture
End of training
d09b2fb verified
{
"epoch": 1.97196261682243,
"eval_loss": 2.7418861389160156,
"eval_runtime": 4.5058,
"eval_samples": 100,
"eval_samples_per_second": 5.326,
"eval_steps_per_second": 5.326,
"total_flos": 4568119699832832.0,
"train_loss": 2.4587962728626325,
"train_runtime": 293.5611,
"train_samples": 1000,
"train_samples_per_second": 1.458,
"train_steps_per_second": 0.361
}