vkasera committed on
Commit
416abc1
·
verified ·
1 Parent(s): 474c73b

Model save

Browse files
Files changed (3) hide show
  1. all_results.json +4 -4
  2. train_results.json +4 -4
  3. trainer_state.json +37 -10
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 0.0535218224234672,
4
- "train_runtime": 8287.7289,
5
  "train_samples": 45000,
6
- "train_samples_per_second": 1.738,
7
- "train_steps_per_second": 0.054
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 0.00019274518191153618,
4
+ "train_runtime": 48.1888,
5
  "train_samples": 45000,
6
+ "train_samples_per_second": 132.811,
7
+ "train_steps_per_second": 4.15
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 0.0535218224234672,
4
- "train_runtime": 8287.7289,
5
  "train_samples": 45000,
6
- "train_samples_per_second": 1.738,
7
- "train_steps_per_second": 0.054
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 0.00019274518191153618,
4
+ "train_runtime": 48.1888,
5
  "train_samples": 45000,
6
+ "train_samples_per_second": 132.811,
7
+ "train_steps_per_second": 4.15
8
  }
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.04,
6
  "eval_steps": 500,
7
- "global_step": 450,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7660,18 +7660,45 @@
7660
  "step": 450
7661
  },
7662
  {
7663
- "epoch": 0.04,
7664
- "step": 450,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7665
  "total_flos": 0.0,
7666
- "train_loss": 0.0535218224234672,
7667
- "train_runtime": 8287.7289,
7668
- "train_samples_per_second": 1.738,
7669
- "train_steps_per_second": 0.054
7670
  }
7671
  ],
7672
  "logging_steps": 2,
7673
- "max_steps": 450,
7674
- "num_input_tokens_seen": 7418212,
7675
  "num_train_epochs": 1,
7676
  "save_steps": 20,
7677
  "stateful_callbacks": {
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.04008888888888889,
6
  "eval_steps": 500,
7
+ "global_step": 451,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7660
  "step": 450
7661
  },
7662
  {
7663
+ "clip_ratio/high_max": 0.0,
7664
+ "clip_ratio/high_mean": 0.0,
7665
+ "clip_ratio/low_mean": 0.0,
7666
+ "clip_ratio/low_min": 0.0,
7667
+ "clip_ratio/region_mean": 0.0,
7668
+ "completions/clipped_ratio": 0.03125,
7669
+ "completions/max_length": 1024.0,
7670
+ "completions/max_terminated_length": 738.0,
7671
+ "completions/mean_length": 384.4375,
7672
+ "completions/mean_terminated_length": 363.8064270019531,
7673
+ "completions/min_length": 138.0,
7674
+ "completions/min_terminated_length": 138.0,
7675
+ "entropy": 0.9260082840919495,
7676
+ "epoch": 0.04008888888888889,
7677
+ "frac_reward_zero_std": 0.75,
7678
+ "kl": 0.04489966729306616,
7679
+ "num_tokens": 7435458.0,
7680
+ "reward": 0.9375,
7681
+ "reward_std": 0.1157275140285492,
7682
+ "rewards/equation_reward_func/mean": 0.0,
7683
+ "rewards/equation_reward_func/std": 0.0,
7684
+ "rewards/format_reward_func/mean": 0.9375,
7685
+ "rewards/format_reward_func/std": 0.24593468010425568,
7686
+ "sampling/importance_sampling_ratio/max": 2.0,
7687
+ "sampling/importance_sampling_ratio/mean": 0.9999629259109497,
7688
+ "sampling/importance_sampling_ratio/min": 0.6872801184654236,
7689
+ "sampling/sampling_logp_difference/max": 0.7735042572021484,
7690
+ "sampling/sampling_logp_difference/mean": 0.017714163288474083,
7691
+ "step": 451,
7692
  "total_flos": 0.0,
7693
+ "train_loss": 0.00019274518191153618,
7694
+ "train_runtime": 48.1888,
7695
+ "train_samples_per_second": 132.811,
7696
+ "train_steps_per_second": 4.15
7697
  }
7698
  ],
7699
  "logging_steps": 2,
7700
+ "max_steps": 200,
7701
+ "num_input_tokens_seen": 7435458,
7702
  "num_train_epochs": 1,
7703
  "save_steps": 20,
7704
  "stateful_callbacks": {