lesso08 committed on
Commit
686f179
·
verified ·
1 Parent(s): d3c81e3

Training in progress, step 11, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:809d286f618987ca63e4c860bd1c08d6a87e41f8d57255781f61654d592b5ae2
3
  size 399632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0a95cc99d679504697a4c5426d479975ae7c4b85530759d2852205b07b6024
3
  size 399632
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dd79a476039611daae375ced2b47e20ab6b4d45a419d0b80e16cb204e80f4c0
3
  size 531130
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d70d5fd50a4acb379cd33db57335c32c5a5e84f14f1afefd17ee537d5aad2775
3
  size 531130
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67ff61294c07bdbde258211fd9f63ac972a29aa29214a2a7ea0304797cbca74f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ce8c58da92c180686c9bb31860b6a2ffffc161335b433ebf495991fc31705db
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb578e75c11a81e85dda67a691f96ba4793a02960f1409fd3e1511aac873491a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a94a3823a4b9fc740a7a6ddf0adc605038b3d31dffac6df2de227ea7d92ecd
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 5.40103006362915,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-10",
4
- "epoch": 0.9302325581395349,
5
  "eval_steps": 5,
6
- "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -101,6 +101,13 @@
101
  "eval_samples_per_second": 35.577,
102
  "eval_steps_per_second": 21.346,
103
  "step": 10
 
 
 
 
 
 
 
104
  }
105
  ],
106
  "logging_steps": 1,
@@ -124,12 +131,12 @@
124
  "should_evaluate": false,
125
  "should_log": false,
126
  "should_save": true,
127
- "should_training_stop": false
128
  },
129
  "attributes": {}
130
  }
131
  },
132
- "total_flos": 1899013079040.0,
133
  "train_batch_size": 2,
134
  "trial_name": null,
135
  "trial_params": null
 
1
  {
2
  "best_metric": 5.40103006362915,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-10",
4
+ "epoch": 1.069767441860465,
5
  "eval_steps": 5,
6
+ "global_step": 11,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
101
  "eval_samples_per_second": 35.577,
102
  "eval_steps_per_second": 21.346,
103
  "step": 10
104
+ },
105
+ {
106
+ "epoch": 1.069767441860465,
107
+ "grad_norm": 15934.6513671875,
108
+ "learning_rate": 0.0,
109
+ "loss": 19.8753,
110
+ "step": 11
111
  }
112
  ],
113
  "logging_steps": 1,
 
131
  "should_evaluate": false,
132
  "should_log": false,
133
  "should_save": true,
134
+ "should_training_stop": true
135
  },
136
  "attributes": {}
137
  }
138
  },
139
+ "total_flos": 2088914386944.0,
140
  "train_batch_size": 2,
141
  "trial_name": null,
142
  "trial_params": null