Model save
Browse files- all_results.json +4 -4
- train_results.json +4 -4
- trainer_state.json +37 -10
all_results.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"total_flos": 0.0,
|
| 3 |
-
"train_loss": 0.
|
| 4 |
-
"train_runtime":
|
| 5 |
"train_samples": 45000,
|
| 6 |
-
"train_samples_per_second":
|
| 7 |
-
"train_steps_per_second":
|
| 8 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"total_flos": 0.0,
|
| 3 |
+
"train_loss": 0.00019274518191153618,
|
| 4 |
+
"train_runtime": 48.1888,
|
| 5 |
"train_samples": 45000,
|
| 6 |
+
"train_samples_per_second": 132.811,
|
| 7 |
+
"train_steps_per_second": 4.15
|
| 8 |
}
|
train_results.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"total_flos": 0.0,
|
| 3 |
-
"train_loss": 0.
|
| 4 |
-
"train_runtime":
|
| 5 |
"train_samples": 45000,
|
| 6 |
-
"train_samples_per_second":
|
| 7 |
-
"train_steps_per_second":
|
| 8 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"total_flos": 0.0,
|
| 3 |
+
"train_loss": 0.00019274518191153618,
|
| 4 |
+
"train_runtime": 48.1888,
|
| 5 |
"train_samples": 45000,
|
| 6 |
+
"train_samples_per_second": 132.811,
|
| 7 |
+
"train_steps_per_second": 4.15
|
| 8 |
}
|
trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -7660,18 +7660,45 @@
|
|
| 7660 |
"step": 450
|
| 7661 |
},
|
| 7662 |
{
|
| 7663 |
-
"
|
| 7664 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7665 |
"total_flos": 0.0,
|
| 7666 |
-
"train_loss": 0.
|
| 7667 |
-
"train_runtime":
|
| 7668 |
-
"train_samples_per_second":
|
| 7669 |
-
"train_steps_per_second":
|
| 7670 |
}
|
| 7671 |
],
|
| 7672 |
"logging_steps": 2,
|
| 7673 |
-
"max_steps":
|
| 7674 |
-
"num_input_tokens_seen":
|
| 7675 |
"num_train_epochs": 1,
|
| 7676 |
"save_steps": 20,
|
| 7677 |
"stateful_callbacks": {
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.04008888888888889,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 451,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 7660 |
"step": 450
|
| 7661 |
},
|
| 7662 |
{
|
| 7663 |
+
"clip_ratio/high_max": 0.0,
|
| 7664 |
+
"clip_ratio/high_mean": 0.0,
|
| 7665 |
+
"clip_ratio/low_mean": 0.0,
|
| 7666 |
+
"clip_ratio/low_min": 0.0,
|
| 7667 |
+
"clip_ratio/region_mean": 0.0,
|
| 7668 |
+
"completions/clipped_ratio": 0.03125,
|
| 7669 |
+
"completions/max_length": 1024.0,
|
| 7670 |
+
"completions/max_terminated_length": 738.0,
|
| 7671 |
+
"completions/mean_length": 384.4375,
|
| 7672 |
+
"completions/mean_terminated_length": 363.8064270019531,
|
| 7673 |
+
"completions/min_length": 138.0,
|
| 7674 |
+
"completions/min_terminated_length": 138.0,
|
| 7675 |
+
"entropy": 0.9260082840919495,
|
| 7676 |
+
"epoch": 0.04008888888888889,
|
| 7677 |
+
"frac_reward_zero_std": 0.75,
|
| 7678 |
+
"kl": 0.04489966729306616,
|
| 7679 |
+
"num_tokens": 7435458.0,
|
| 7680 |
+
"reward": 0.9375,
|
| 7681 |
+
"reward_std": 0.1157275140285492,
|
| 7682 |
+
"rewards/equation_reward_func/mean": 0.0,
|
| 7683 |
+
"rewards/equation_reward_func/std": 0.0,
|
| 7684 |
+
"rewards/format_reward_func/mean": 0.9375,
|
| 7685 |
+
"rewards/format_reward_func/std": 0.24593468010425568,
|
| 7686 |
+
"sampling/importance_sampling_ratio/max": 2.0,
|
| 7687 |
+
"sampling/importance_sampling_ratio/mean": 0.9999629259109497,
|
| 7688 |
+
"sampling/importance_sampling_ratio/min": 0.6872801184654236,
|
| 7689 |
+
"sampling/sampling_logp_difference/max": 0.7735042572021484,
|
| 7690 |
+
"sampling/sampling_logp_difference/mean": 0.017714163288474083,
|
| 7691 |
+
"step": 451,
|
| 7692 |
"total_flos": 0.0,
|
| 7693 |
+
"train_loss": 0.00019274518191153618,
|
| 7694 |
+
"train_runtime": 48.1888,
|
| 7695 |
+
"train_samples_per_second": 132.811,
|
| 7696 |
+
"train_steps_per_second": 4.15
|
| 7697 |
}
|
| 7698 |
],
|
| 7699 |
"logging_steps": 2,
|
| 7700 |
+
"max_steps": 200,
|
| 7701 |
+
"num_input_tokens_seen": 7435458,
|
| 7702 |
"num_train_epochs": 1,
|
| 7703 |
"save_steps": 20,
|
| 7704 |
"stateful_callbacks": {
|