ben81828 commited on
Commit
582a8b8
·
verified ·
1 Parent(s): 9119268

Training in progress, step 11200, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fbe11c8cfeee8afaad07093a52a298b4d54ead24b79f9d7147b4ac16e702d7d
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb613b7a256807ef338a6d86f6b8835264592147c48b1ceb1576db73a2d29ecf
3
  size 29034840
last-checkpoint/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a49247f7a5dbb85046813911c81b147441052c36d2a1ee9cf330b58471b6ff9
3
+ size 43429616
last-checkpoint/global_step11200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5ea2a7518990ad8edea9270a514be2de59223da7afa5f14537ec8573accee9b
3
+ size 43429616
last-checkpoint/global_step11200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518e8c3960d9e5b06111d37f383dc862a7c2a612b5d6ee42b7603008462ca0d5
3
+ size 43429616
last-checkpoint/global_step11200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eed55d8d4ba5e0e6a9d2ac0877904297366897ddb65fdf29500074c993d14553
3
+ size 43429616
last-checkpoint/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dc65f41042186a6597d9e0506facac488c22fa317baaffddcedfd697058d8b5
3
+ size 637299
last-checkpoint/global_step11200/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e86839a06130ed51c7d0ca21cac3ad51f5eba0728a326c8a7a5c6a63a97ce158
3
+ size 637171
last-checkpoint/global_step11200/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a3aa91a406ac13e36de963177af8adf12c4b4d32962b627acf16fdaab4b58a2
3
+ size 637171
last-checkpoint/global_step11200/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c9805a34d4a0445d38244a8b34fcf2f5397c5a7d11ccca273a174e9bd667edc
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step11150
 
1
+ global_step11200
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3cad2c8b29e598e7e2ffcc6315ff1051f90214a6e97debdcd92d23904705b4a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5a58aaf06ec2b8eda78c5f2f2ac7148a98cae00fe24702bd54e14ca6f5a7216
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ca6102c873816870ffe4b66e9e18be91dca3aa16a90760134101413ffd75685
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e49b44e414e04e39f0702fc16eb809e710c1fb4097853c3426e644ce631651d
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:418c34b07fefc23a05efe584b58a927935a830386544b2611439d820010bd5b7
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acd3a64f00be04c08ec9e76003e026cd7fe1360420cba01612487f382a8779cc
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37bc6d29978d73b25002f388347dac14f60527042f328ee71a4c8e6b288a82b8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a3abf68c456fd01db337f7f7a45adf467d83d959fd2e573783cb280ebc87f2
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:538ca13148fdaae10d2a4068d9e6e005cd6c9092b2043d01d85a688dfe8c7d39
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72262b6106604c5f1a98229085b73dca3b965e0b9c41eaabfcd828a3f9df568a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.04092838987708092,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
4
- "epoch": 1.3660531071023858,
5
  "eval_steps": 50,
6
- "global_step": 11150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -19854,11 +19854,100 @@
19854
  "eval_steps_per_second": 0.774,
19855
  "num_input_tokens_seen": 74528296,
19856
  "step": 11150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19857
  }
19858
  ],
19859
  "logging_steps": 5,
19860
  "max_steps": 16324,
19861
- "num_input_tokens_seen": 74528296,
19862
  "num_train_epochs": 2,
19863
  "save_steps": 50,
19864
  "stateful_callbacks": {
@@ -19873,7 +19962,7 @@
19873
  "attributes": {}
19874
  }
19875
  },
19876
- "total_flos": 4674728332099584.0,
19877
  "train_batch_size": 1,
19878
  "trial_name": null,
19879
  "trial_params": null
 
1
  {
2
  "best_metric": 0.04092838987708092,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
4
+ "epoch": 1.372178493767419,
5
  "eval_steps": 50,
6
+ "global_step": 11200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
19854
  "eval_steps_per_second": 0.774,
19855
  "num_input_tokens_seen": 74528296,
19856
  "step": 11150
19857
+ },
19858
+ {
19859
+ "epoch": 1.3666656457688893,
19860
+ "grad_norm": 1.1954091110116585,
19861
+ "learning_rate": 2.500000000000001e-05,
19862
+ "loss": 0.1971,
19863
+ "num_input_tokens_seen": 74562368,
19864
+ "step": 11155
19865
+ },
19866
+ {
19867
+ "epoch": 1.3672781844353925,
19868
+ "grad_norm": 1.448181363417585,
19869
+ "learning_rate": 2.4956150399745375e-05,
19870
+ "loss": 0.2395,
19871
+ "num_input_tokens_seen": 74596328,
19872
+ "step": 11160
19873
+ },
19874
+ {
19875
+ "epoch": 1.3678907231018957,
19876
+ "grad_norm": 2.1272140492982055,
19877
+ "learning_rate": 2.4912326496656762e-05,
19878
+ "loss": 0.2587,
19879
+ "num_input_tokens_seen": 74629408,
19880
+ "step": 11165
19881
+ },
19882
+ {
19883
+ "epoch": 1.3685032617683992,
19884
+ "grad_norm": 1.2118543871719263,
19885
+ "learning_rate": 2.4868528335701275e-05,
19886
+ "loss": 0.2276,
19887
+ "num_input_tokens_seen": 74662920,
19888
+ "step": 11170
19889
+ },
19890
+ {
19891
+ "epoch": 1.3691158004349024,
19892
+ "grad_norm": 1.5201689858137362,
19893
+ "learning_rate": 2.4824755961819647e-05,
19894
+ "loss": 0.2238,
19895
+ "num_input_tokens_seen": 74696728,
19896
+ "step": 11175
19897
+ },
19898
+ {
19899
+ "epoch": 1.369728339101406,
19900
+ "grad_norm": 1.6964360928117685,
19901
+ "learning_rate": 2.478100941992613e-05,
19902
+ "loss": 0.2288,
19903
+ "num_input_tokens_seen": 74730448,
19904
+ "step": 11180
19905
+ },
19906
+ {
19907
+ "epoch": 1.3703408777679091,
19908
+ "grad_norm": 1.0971640842186783,
19909
+ "learning_rate": 2.4737288754908517e-05,
19910
+ "loss": 0.2066,
19911
+ "num_input_tokens_seen": 74764088,
19912
+ "step": 11185
19913
+ },
19914
+ {
19915
+ "epoch": 1.3709534164344124,
19916
+ "grad_norm": 0.9738244569482346,
19917
+ "learning_rate": 2.469359401162795e-05,
19918
+ "loss": 0.2158,
19919
+ "num_input_tokens_seen": 74797488,
19920
+ "step": 11190
19921
+ },
19922
+ {
19923
+ "epoch": 1.3715659551009156,
19924
+ "grad_norm": 1.1636541723418108,
19925
+ "learning_rate": 2.4649925234919063e-05,
19926
+ "loss": 0.1934,
19927
+ "num_input_tokens_seen": 74830920,
19928
+ "step": 11195
19929
+ },
19930
+ {
19931
+ "epoch": 1.372178493767419,
19932
+ "grad_norm": 1.107536927721727,
19933
+ "learning_rate": 2.4606282469589837e-05,
19934
+ "loss": 0.1875,
19935
+ "num_input_tokens_seen": 74864760,
19936
+ "step": 11200
19937
+ },
19938
+ {
19939
+ "epoch": 1.372178493767419,
19940
+ "eval_loss": 0.15537530183792114,
19941
+ "eval_runtime": 19.755,
19942
+ "eval_samples_per_second": 3.037,
19943
+ "eval_steps_per_second": 0.759,
19944
+ "num_input_tokens_seen": 74864760,
19945
+ "step": 11200
19946
  }
19947
  ],
19948
  "logging_steps": 5,
19949
  "max_steps": 16324,
19950
+ "num_input_tokens_seen": 74864760,
19951
  "num_train_epochs": 2,
19952
  "save_steps": 50,
19953
  "stateful_callbacks": {
 
19962
  "attributes": {}
19963
  }
19964
  },
19965
+ "total_flos": 4695845966708736.0,
19966
  "train_batch_size": 1,
19967
  "trial_name": null,
19968
  "trial_params": null