Training in progress, step 10800, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step10800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step10800/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step10800/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step10800/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step10800/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step10800/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step10800/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step10800/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +93 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e4513dc6210047a9fb7847fcd8dca9ea72c66f2fa26d93bb8d271292c119000
|
3 |
size 29034840
|
last-checkpoint/global_step10800/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63ce0a2f24316b30f620b7817dac68975b70e7731a2f980ba413040803bfb63b
|
3 |
+
size 43429616
|
last-checkpoint/global_step10800/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2ce3fb811e5ca927632e5643aea491a79735e24c1c30e6f9fbe956ea4b5e346
|
3 |
+
size 43429616
|
last-checkpoint/global_step10800/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab467a149e2303100c799725bb4a91561d762adec22e61a0d320a18e6befc8fe
|
3 |
+
size 43429616
|
last-checkpoint/global_step10800/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1a3c35b256455784ead1e107c4517e95d0d2e26d1b5a4da10fb40285ae7a3fc
|
3 |
+
size 43429616
|
last-checkpoint/global_step10800/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b3c45b6072c8ec1d5de03ae17a5c99d83f5f6d50702503743b6d72503edaa6e
|
3 |
+
size 637299
|
last-checkpoint/global_step10800/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99dcf81581f5f9a4f224dec5b72fb467d95a5ccff25660c64901ddb2828c0309
|
3 |
+
size 637171
|
last-checkpoint/global_step10800/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b0219cf2633ca9908484808e0038e5e7cbaeb4ba3fd3465a482dd73eefcf229
|
3 |
+
size 637171
|
last-checkpoint/global_step10800/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a95eeb140f3beb635de116eb6468962aeb39b2acea57d5f0d055f07d57fe27f
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step10800
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1697566a46881a626d7b5d7beeaf289eac7abb3228dc7404e0abf936b05d4ecc
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d802f0e69cab074744bc89d46c3b349ac14f92f80481496c2f70e7778110860
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e55641df0b2f672b919df6bc2b163e11f9f68b4af48913c5d1f39652bcf684a
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f31bf4d015bf75b22523ff6d07fa44113e2ddd158194f253c1045597104a3b95
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fff0973103028dda8c2cfd5448604f90903bbc3b50457f78601cf11a034cd22
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
-
"epoch": 1.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -19142,11 +19142,100 @@
|
|
19142 |
"eval_steps_per_second": 0.75,
|
19143 |
"num_input_tokens_seen": 71837520,
|
19144 |
"step": 10750
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19145 |
}
|
19146 |
],
|
19147 |
"logging_steps": 5,
|
19148 |
"max_steps": 16324,
|
19149 |
-
"num_input_tokens_seen":
|
19150 |
"num_train_epochs": 2,
|
19151 |
"save_steps": 50,
|
19152 |
"stateful_callbacks": {
|
@@ -19161,7 +19250,7 @@
|
|
19161 |
"attributes": {}
|
19162 |
}
|
19163 |
},
|
19164 |
-
"total_flos":
|
19165 |
"train_batch_size": 1,
|
19166 |
"trial_name": null,
|
19167 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
+
"epoch": 1.3231754004471532,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 10800,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
19142 |
"eval_steps_per_second": 0.75,
|
19143 |
"num_input_tokens_seen": 71837520,
|
19144 |
"step": 10750
|
19145 |
+
},
|
19146 |
+
{
|
19147 |
+
"epoch": 1.3176625524486232,
|
19148 |
+
"grad_norm": 1.1943825653656646,
|
19149 |
+
"learning_rate": 2.858719744588928e-05,
|
19150 |
+
"loss": 0.1921,
|
19151 |
+
"num_input_tokens_seen": 71870856,
|
19152 |
+
"step": 10755
|
19153 |
+
},
|
19154 |
+
{
|
19155 |
+
"epoch": 1.3182750911151266,
|
19156 |
+
"grad_norm": 1.2513095958234757,
|
19157 |
+
"learning_rate": 2.854144001950314e-05,
|
19158 |
+
"loss": 0.1655,
|
19159 |
+
"num_input_tokens_seen": 71904984,
|
19160 |
+
"step": 10760
|
19161 |
+
},
|
19162 |
+
{
|
19163 |
+
"epoch": 1.31888762978163,
|
19164 |
+
"grad_norm": 0.9949634903926544,
|
19165 |
+
"learning_rate": 2.8495704611464275e-05,
|
19166 |
+
"loss": 0.1703,
|
19167 |
+
"num_input_tokens_seen": 71939480,
|
19168 |
+
"step": 10765
|
19169 |
+
},
|
19170 |
+
{
|
19171 |
+
"epoch": 1.3195001684481333,
|
19172 |
+
"grad_norm": 1.1828002010795184,
|
19173 |
+
"learning_rate": 2.8449991268701208e-05,
|
19174 |
+
"loss": 0.2253,
|
19175 |
+
"num_input_tokens_seen": 71973360,
|
19176 |
+
"step": 10770
|
19177 |
+
},
|
19178 |
+
{
|
19179 |
+
"epoch": 1.3201127071146366,
|
19180 |
+
"grad_norm": 1.375476605140409,
|
19181 |
+
"learning_rate": 2.8404300038119825e-05,
|
19182 |
+
"loss": 0.2047,
|
19183 |
+
"num_input_tokens_seen": 72007440,
|
19184 |
+
"step": 10775
|
19185 |
+
},
|
19186 |
+
{
|
19187 |
+
"epoch": 1.3207252457811398,
|
19188 |
+
"grad_norm": 1.1086035003719277,
|
19189 |
+
"learning_rate": 2.835863096660325e-05,
|
19190 |
+
"loss": 0.1839,
|
19191 |
+
"num_input_tokens_seen": 72041328,
|
19192 |
+
"step": 10780
|
19193 |
+
},
|
19194 |
+
{
|
19195 |
+
"epoch": 1.3213377844476433,
|
19196 |
+
"grad_norm": 1.202221399382527,
|
19197 |
+
"learning_rate": 2.8312984101011946e-05,
|
19198 |
+
"loss": 0.2406,
|
19199 |
+
"num_input_tokens_seen": 72074904,
|
19200 |
+
"step": 10785
|
19201 |
+
},
|
19202 |
+
{
|
19203 |
+
"epoch": 1.3219503231141465,
|
19204 |
+
"grad_norm": 1.3913683968268147,
|
19205 |
+
"learning_rate": 2.826735948818358e-05,
|
19206 |
+
"loss": 0.2341,
|
19207 |
+
"num_input_tokens_seen": 72108648,
|
19208 |
+
"step": 10790
|
19209 |
+
},
|
19210 |
+
{
|
19211 |
+
"epoch": 1.32256286178065,
|
19212 |
+
"grad_norm": 1.8386972604975618,
|
19213 |
+
"learning_rate": 2.8221757174932938e-05,
|
19214 |
+
"loss": 0.2294,
|
19215 |
+
"num_input_tokens_seen": 72141880,
|
19216 |
+
"step": 10795
|
19217 |
+
},
|
19218 |
+
{
|
19219 |
+
"epoch": 1.3231754004471532,
|
19220 |
+
"grad_norm": 1.2668737312898322,
|
19221 |
+
"learning_rate": 2.817617720805197e-05,
|
19222 |
+
"loss": 0.2369,
|
19223 |
+
"num_input_tokens_seen": 72175680,
|
19224 |
+
"step": 10800
|
19225 |
+
},
|
19226 |
+
{
|
19227 |
+
"epoch": 1.3231754004471532,
|
19228 |
+
"eval_loss": 0.17310434579849243,
|
19229 |
+
"eval_runtime": 19.7821,
|
19230 |
+
"eval_samples_per_second": 3.033,
|
19231 |
+
"eval_steps_per_second": 0.758,
|
19232 |
+
"num_input_tokens_seen": 72175680,
|
19233 |
+
"step": 10800
|
19234 |
}
|
19235 |
],
|
19236 |
"logging_steps": 5,
|
19237 |
"max_steps": 16324,
|
19238 |
+
"num_input_tokens_seen": 72175680,
|
19239 |
"num_train_epochs": 2,
|
19240 |
"save_steps": 50,
|
19241 |
"stateful_callbacks": {
|
|
|
19250 |
"attributes": {}
|
19251 |
}
|
19252 |
},
|
19253 |
+
"total_flos": 4527150548385792.0,
|
19254 |
"train_batch_size": 1,
|
19255 |
"trial_name": null,
|
19256 |
"trial_params": null
|