evgmaslov commited on
Commit
24dcb7c
·
verified ·
1 Parent(s): 076e547

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db7393a00b23c188bb726efbdf23677d14ce6d8b17888a4fe426f83a22ba0d46
3
  size 157308096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b88e26b3c4ca161876578eead64e78efe3b3e2821830560c1c97c813c468f224
3
  size 157308096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f33b321c7bf7df2a4b6bc46e3e86b50207c7b2a2b34118f8114072b044f4d43
3
  size 314671226
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a385a4ca54748984eabf77bdd9e798a5e8fc9caf8ee4975a63d25a159e6c1a14
3
  size 314671226
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9afbf9b2cc7ffb82e39603ea3e9793624776e974898f71cddb75c50b95a8ff20
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf67396b3f5e7812c3f643f4791afc66cf2fff82b1f835f1b6ad24a482f916d
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca4fa167ac420fbc12a0b1225ad375db648a55f16b7e4866651104ea0cc00a49
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8087188847eb84108011bace714d18665773726c961ffd953c373d3f67be38ac
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e799329eb62e1eb372f5e1a106e0710d002dddfe0cb96b7478769d095e752b5f
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61125affad5badfd455e8c7159bc1d0b871f0ac92fdd51cf256c2c41166e1e61
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:148ecc351dae84aea8cdc86447e26d57a1165551634773232252cd35029fec44
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abff5899c002d2436c9775c2d31f07f3860e32bc366743306ba740ce007b61af
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6c737fa9218e50ea3ce9320b640c05dff0f18b8b0409fe5e3f6340fa144ae6f
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:348c3b3827abbe2c183d19854f3cd62cdb609a4c9ae3c8da2a88576282b91074
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40fdcad7ba51bcc458150b1d4b2c87d4dee4fcbb7619ccd347b91ff0f61763b2
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47a1cbe7224ddcd45ba51cd82e937371aec5c1844f6e9a2e51ed4929da4a1380
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3d21b509f3e70f8a0fe13164c8b6d889c6ab04755a1218812e3a6427ea94537
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc846e4b568eb6761e0906589aaea0b96addeb10845d66b84daf70a7f9bd338
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1304350d7f8258aaa5c749bd82f5c7ddf08eafecb5eb5f18652eb3f7d1198b19
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d09531311015d468fca38f844a94113b24df2885708c8302833f4fbd34dfc01
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d0bcc3306c506981564a07ff3b261b32731741ed53940e879827feb4c6814eb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:142423e5284e8a2b264afd5ee9e923d28ec4d4b3096cd413897dc990937cc484
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.013807659968733788,
3
- "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-300",
4
- "epoch": 0.37546933667083854,
5
  "eval_steps": 100,
6
- "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -31,6 +31,14 @@
31
  "eval_samples_per_second": 6.011,
32
  "eval_steps_per_second": 0.376,
33
  "step": 300
 
 
 
 
 
 
 
 
34
  }
35
  ],
36
  "logging_steps": 500,
@@ -50,7 +58,7 @@
50
  "attributes": {}
51
  }
52
  },
53
- "total_flos": 3.425702422511616e+17,
54
  "train_batch_size": 2,
55
  "trial_name": null,
56
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.013731677085161209,
3
+ "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-400",
4
+ "epoch": 0.5006257822277848,
5
  "eval_steps": 100,
6
+ "global_step": 400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
31
  "eval_samples_per_second": 6.011,
32
  "eval_steps_per_second": 0.376,
33
  "step": 300
34
+ },
35
+ {
36
+ "epoch": 0.5006257822277848,
37
+ "eval_loss": 0.013731677085161209,
38
+ "eval_runtime": 5.3205,
39
+ "eval_samples_per_second": 6.014,
40
+ "eval_steps_per_second": 0.376,
41
+ "step": 400
42
  }
43
  ],
44
  "logging_steps": 500,
 
58
  "attributes": {}
59
  }
60
  },
61
+ "total_flos": 4.567603230015488e+17,
62
  "train_batch_size": 2,
63
  "trial_name": null,
64
  "trial_params": null