PhoenixB commited on
Commit
7168d3c
·
verified ·
1 Parent(s): 5be9fe8

Training in progress, step 24, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7afb463104162bf4e9f1d10076bf189c7d775e4575db1da1224a852baa88b767
3
  size 161533192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ba439b31da40ff6545b36f10bf2088503cd9dea9d31f61fb9a3d8017beae65c
3
  size 161533192
last-checkpoint/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4df9d9f2b8d46b1730c5a393376634fbf7d7edfba1f71f4c55808c0ce5a5af37
3
  size 323311082
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b167ec1b666e8efbcade53545b496c1fa7f52cd8119115ce70f37b4cbf323b9
3
  size 323311082
last-checkpoint/pytorch_model_fsdp.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:938dc7835e27c1d17ad3e4ccaa82831bf6732d830784887d63a6ca026feada4d
3
  size 161626662
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18083d90c673193948f1cfa9c2bd07fe9b613716d27d6061ff34a78ffe28be12
3
  size 161626662
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bebf6cc5c8c7780feadaebd275d45bcf2ecda4d47e61bbd51368454f4d1c553
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21b50e03f15fbc12dbbda95def3adbd15c7f7294db0db88cc217672a7686e8b4
3
  size 14512
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88eb0519ba5419045287051a9023514a1ac66b2ff4faa690c6ef26d732fe7601
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a475bf81f402c30ceed6fd5d0f731aea39f076be079d3c3684f6d4e6041d1462
3
  size 14512
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d66ac607544becbf0b1e2248ebb09e59e5572bf9bfa9d7d701b793d0945c55db
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:859214dc387eb3e62419c68b424697c31e86f60684ce969a4432863354d30aa8
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.01353528843055108,
6
  "eval_steps": 3,
7
- "global_step": 21,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -219,6 +219,35 @@
219
  "eval_samples_per_second": 10.959,
220
  "eval_steps_per_second": 2.74,
221
  "step": 21
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
222
  }
223
  ],
224
  "logging_steps": 1,
@@ -238,7 +267,7 @@
238
  "attributes": {}
239
  }
240
  },
241
- "total_flos": 1.919921093921997e+16,
242
  "train_batch_size": 2,
243
  "trial_name": null,
244
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.015468901063486949,
6
  "eval_steps": 3,
7
+ "global_step": 24,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
219
  "eval_samples_per_second": 10.959,
220
  "eval_steps_per_second": 2.74,
221
  "step": 21
222
+ },
223
+ {
224
+ "epoch": 0.014179825974863036,
225
+ "grad_norm": 0.7142388224601746,
226
+ "learning_rate": 5.7422070843492734e-05,
227
+ "loss": 1.4037,
228
+ "step": 22
229
+ },
230
+ {
231
+ "epoch": 0.014824363519174991,
232
+ "grad_norm": 0.9205169081687927,
233
+ "learning_rate": 4.6417320502100316e-05,
234
+ "loss": 1.6486,
235
+ "step": 23
236
+ },
237
+ {
238
+ "epoch": 0.015468901063486949,
239
+ "grad_norm": 1.2948448657989502,
240
+ "learning_rate": 3.6257601025131026e-05,
241
+ "loss": 1.6989,
242
+ "step": 24
243
+ },
244
+ {
245
+ "epoch": 0.015468901063486949,
246
+ "eval_loss": 3.01545786857605,
247
+ "eval_runtime": 460.7675,
248
+ "eval_samples_per_second": 11.344,
249
+ "eval_steps_per_second": 2.837,
250
+ "step": 24
251
  }
252
  ],
253
  "logging_steps": 1,
 
267
  "attributes": {}
268
  }
269
  },
270
+ "total_flos": 2.028467876213555e+16,
271
  "train_batch_size": 2,
272
  "trial_name": null,
273
  "trial_params": null