Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +0 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/000-GPT-XL/log.txt +10 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/001-GPT-XL/log.txt +18 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/003-GPT-XL/log.txt +4 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_4_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_5_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_6_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_7_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_8_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/log.txt +99 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/0046000.pt +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
.gitattributes
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/000-GPT-XL/log.txt
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[[34m2025-04-23 09:11:27[0m] Experiment directory created at checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/000-GPT-XL
|
2 |
+
[[34m2025-04-23 09:11:27[0m] Namespace(data_path='/tmp/haozhezhao/MLLMG/jsonl_data/merged_train_set_set_subject_400k_recap_t2i_400k_flux_200k_midjourney_150k_recovery_150k_grounding_100fluxseg_50samseg.jsonl', cloud_save_path='/tmp/haozhezhao/checkpoint', no_local_save=False, vq_model='VQ-16', vq_ckpt='/tmp/haozhezhao/model/llamagen_t2i/vq_ds16_t2i.pt', codebook_size=16384, codebook_embed_dim=8, gpt_model='GPT-XL', gpt_ckpt='/tmp/haozhezhao/MLLMG_ckpkts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt', gpt_type='t2i', vocab_size=16384, cls_token_num=512, dropout_p=0.1, token_dropout_p=0.1, drop_path=0.0, no_compile=False, results_dir='checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated', dataset='ti2i', image_size=512, downsample_size=16, num_classes=1000, epochs=2, lr=0.0003, weight_decay=0.05, beta1=0.9, beta2=0.95, max_grad_norm=1.0, global_batch_size=64, global_seed=0, num_workers=8, log_every=25, ckpt_every=2000, gradient_accumulation_steps=4, mixed_precision='bf16', val_data_path='/tmp/haozhezhao/MLLMG/jsonl_data/dreambench_plus_valid.jsonl', use_vision_tower=True, model_name_or_path='/tmp/haozhezhao/model/blip2-flan-t5-xl', image_place_holder='<image>', processor_path=None, do_eval=True, max_eval_samples=500, train_text_encoder=True, no_left_padding=False, cfg_scale=7.5, top_k=16384, temperature=0.9, top_p=1.0, eval_steps=2000, project_name='llamagen_ti2i', load_from_checkpoint='/tmp/haozhezhao/MLLMG/checkpoint/FIXed_3M_1epoch_step32000.pt', warmup=0.05, lr_decay_style='cosine', lr_decay_ratio=0.1, train_iters=500000, class_dropout_prob=0.1, with_image_only=False, image_only_rate=0.1, stage2=False, subject_driven=True, load_subject_embedding=None, reference_data_path='/tmp/haozhezhao/MLLMG/cc12m_reference_tunnel.jsonl', multimodal_encoder='llava', do_recovery=True, no_replace=False, resume=False, dreambench_eval=True, find_unused_parameters=True, load_visual_encoder=False, continue_stage1=False, replace_subject=False, train_all=True, save_total_limit=1, load_language_projection='/tmp/haozhezhao/MLLMG/llava-v1.5-flant5_fixed-pretrain/mm_projector.bin', mm_vision_tower='openai/clip-vit-large-patch14', load_fixed_llamagen=True, unfreeze_output=False, fix='gpt-empty-fix', rank=0, world_size=8, gpu=0, dist_url='env://', distributed=True, dist_backend='nccl')
|
3 |
+
[[34m2025-04-23 09:11:27[0m] Starting rank=0, seed=0, world_size=8.
|
4 |
+
[[34m2025-04-23 09:11:27[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
5 |
+
[[34m2025-04-23 09:12:39[0m] GPT Parameters: 2,310,680,832
|
6 |
+
[[34m2025-04-23 09:12:39[0m] num decayed parameter tensors: 356, with 2,007,303,168 parameters
|
7 |
+
[[34m2025-04-23 09:12:39[0m] num non-decayed parameter tensors: 124, with 197,888 parameters
|
8 |
+
[[34m2025-04-23 09:12:39[0m] using fused AdamW: True
|
9 |
+
[[34m2025-04-23 09:12:49[0m] Dataset contains 1,313,682 images
|
10 |
+
[[34m2025-04-23 09:12:49[0m] Train iters 41052 , warmup 2052.6, len of loader 20526
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/001-GPT-XL/log.txt
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[[34m2025-04-23 10:50:20[0m] Experiment directory created at checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/001-GPT-XL
|
2 |
+
[[34m2025-04-23 10:50:20[0m] Namespace(data_path='/tmp/haozhezhao/MLLMG/jsonl_data/merged_train_set_set_subject_400k_recap_t2i_400k_flux_200k_midjourney_150k_recovery_150k_grounding_100fluxseg_50samseg.jsonl', cloud_save_path='/tmp/haozhezhao/checkpoint', no_local_save=False, vq_model='VQ-16', vq_ckpt='/tmp/haozhezhao/model/llamagen_t2i/vq_ds16_t2i.pt', codebook_size=16384, codebook_embed_dim=8, gpt_model='GPT-XL', gpt_ckpt='/tmp/haozhezhao/MLLMG/MLLMG_ckpts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt', gpt_type='t2i', vocab_size=16384, cls_token_num=512, dropout_p=0.1, token_dropout_p=0.1, drop_path=0.0, no_compile=False, results_dir='checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated', dataset='ti2i', image_size=512, downsample_size=16, num_classes=1000, epochs=2, lr=0.0003, weight_decay=0.05, beta1=0.9, beta2=0.95, max_grad_norm=1.0, global_batch_size=64, global_seed=0, num_workers=8, log_every=25, ckpt_every=2000, gradient_accumulation_steps=4, mixed_precision='bf16', val_data_path='/tmp/haozhezhao/MLLMG/jsonl_data/dreambench_plus_valid.jsonl', use_vision_tower=True, model_name_or_path='/tmp/haozhezhao/model/blip2-flan-t5-xl', image_place_holder='<image>', processor_path=None, do_eval=True, max_eval_samples=500, train_text_encoder=True, no_left_padding=False, cfg_scale=7.5, top_k=16384, temperature=0.9, top_p=1.0, eval_steps=2000, project_name='llamagen_ti2i', load_from_checkpoint='/tmp/haozhezhao/MLLMG/checkpoint/FIXed_3M_1epoch_step32000.pt', warmup=0.05, lr_decay_style='cosine', lr_decay_ratio=0.1, train_iters=500000, class_dropout_prob=0.1, with_image_only=False, image_only_rate=0.1, stage2=False, subject_driven=True, load_subject_embedding=None, reference_data_path='/tmp/haozhezhao/MLLMG/cc12m_reference_tunnel.jsonl', multimodal_encoder='llava', do_recovery=True, no_replace=False, resume=False, dreambench_eval=True, find_unused_parameters=True, load_visual_encoder=False, continue_stage1=False, replace_subject=False, train_all=True, save_total_limit=1, load_language_projection='/tmp/haozhezhao/MLLMG/llava-v1.5-flant5_fixed-pretrain/mm_projector.bin', mm_vision_tower='openai/clip-vit-large-patch14', load_fixed_llamagen=True, unfreeze_output=False, fix='gpt-empty-fix', rank=0, world_size=8, gpu=0, dist_url='env://', distributed=True, dist_backend='nccl')
|
3 |
+
[[34m2025-04-23 10:50:20[0m] Starting rank=0, seed=0, world_size=8.
|
4 |
+
[[34m2025-04-23 10:50:20[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
5 |
+
[[34m2025-04-23 10:51:26[0m] GPT Parameters: 2,310,680,832
|
6 |
+
[[34m2025-04-23 10:51:26[0m] num decayed parameter tensors: 356, with 2,007,303,168 parameters
|
7 |
+
[[34m2025-04-23 10:51:26[0m] num non-decayed parameter tensors: 124, with 197,888 parameters
|
8 |
+
[[34m2025-04-23 10:51:26[0m] using fused AdamW: True
|
9 |
+
[[34m2025-04-23 10:51:35[0m] Dataset contains 1,313,682 images
|
10 |
+
[[34m2025-04-23 10:51:35[0m] Train iters 41052 , warmup 2052.6, len of loader 20526
|
11 |
+
[[34m2025-04-23 10:52:03[0m] ### LOAD pretraining weights from checkpoint: /tmp/haozhezhao/MLLMG/MLLMG_ckpts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt
|
12 |
+
[[34m2025-04-23 10:52:03[0m] Initial state: steps=0, epochs=0
|
13 |
+
[[34m2025-04-23 10:52:03[0m] compiling the model... (may take several minutes)
|
14 |
+
[[34m2025-04-23 10:52:04[0m] freeze the vit
|
15 |
+
[[34m2025-04-23 10:52:04[0m] ***** total param is 2310680832 *****
|
16 |
+
[[34m2025-04-23 10:52:04[0m] ***** total trained param is 2007501056 *****
|
17 |
+
[[34m2025-04-23 10:52:06[0m] Training for 2 epochs...
|
18 |
+
[[34m2025-04-23 10:52:06[0m] Beginning epoch 0...
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/003-GPT-XL/log.txt
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[[34m2025-04-23 11:01:15[0m] Experiment directory created at checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/003-GPT-XL
|
2 |
+
[[34m2025-04-23 11:01:15[0m] Namespace(data_path='/tmp/haozhezhao/MLLMG/jsonl_data/merged_train_set_set_subject_400k_recap_t2i_400k_flux_200k_midjourney_150k_recovery_150k_grounding_100fluxseg_50samseg.jsonl', cloud_save_path='/tmp/haozhezhao/checkpoint', no_local_save=False, vq_model='VQ-16', vq_ckpt='/tmp/haozhezhao/model/llamagen_t2i/vq_ds16_t2i.pt', codebook_size=16384, codebook_embed_dim=8, gpt_model='GPT-XL', gpt_ckpt='/tmp/haozhezhao/MLLMG/MLLMG_ckpts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt', gpt_type='t2i', vocab_size=16384, cls_token_num=512, dropout_p=0.1, token_dropout_p=0.1, drop_path=0.0, no_compile=False, results_dir='checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated', dataset='ti2i', image_size=512, downsample_size=16, num_classes=1000, epochs=2, lr=0.0003, weight_decay=0.05, beta1=0.9, beta2=0.95, max_grad_norm=1.0, global_batch_size=64, global_seed=0, num_workers=8, log_every=25, ckpt_every=2000, gradient_accumulation_steps=4, mixed_precision='bf16', val_data_path='/tmp/haozhezhao/MLLMG/jsonl_data/dreambench_plus_valid.jsonl', use_vision_tower=True, model_name_or_path='/tmp/haozhezhao/model/blip2-flan-t5-xl', image_place_holder='<image>', processor_path=None, do_eval=True, max_eval_samples=500, train_text_encoder=True, no_left_padding=False, cfg_scale=7.5, top_k=16384, temperature=0.9, top_p=1.0, eval_steps=2000, project_name='llamagen_ti2i', load_from_checkpoint='/tmp/haozhezhao/MLLMG/checkpoint/FIXed_3M_1epoch_step32000.pt', warmup=0.05, lr_decay_style='cosine', lr_decay_ratio=0.1, train_iters=500000, class_dropout_prob=0.1, with_image_only=False, image_only_rate=0.1, stage2=False, subject_driven=True, load_subject_embedding=None, reference_data_path='/tmp/haozhezhao/MLLMG/cc12m_reference_tunnel.jsonl', multimodal_encoder='llava', do_recovery=True, no_replace=False, resume=False, dreambench_eval=True, find_unused_parameters=True, load_visual_encoder=False, continue_stage1=False, replace_subject=False, train_all=True, save_total_limit=1, load_language_projection='/tmp/haozhezhao/MLLMG/llava-v1.5-flant5_fixed-pretrain/mm_projector.bin', mm_vision_tower='openai/clip-vit-large-patch14', load_fixed_llamagen=True, unfreeze_output=False, fix='gpt-empty-fix', rank=0, world_size=8, gpu=0, dist_url='env://', distributed=True, dist_backend='nccl')
|
3 |
+
[[34m2025-04-23 11:01:15[0m] Starting rank=0, seed=0, world_size=8.
|
4 |
+
[[34m2025-04-23 11:01:15[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_4_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_5_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_6_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_7_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/checkpoints/eval_step_2000/batch_8_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL/log.txt
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[[34m2025-04-23 11:12:04[0m] Experiment directory created at checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/004-GPT-XL
|
2 |
+
[[34m2025-04-23 11:12:04[0m] Namespace(data_path='/tmp/haozhezhao/MLLMG/jsonl_data/merged_train_set_set_subject_400k_recap_t2i_400k_flux_200k_midjourney_150k_recovery_150k_grounding_100fluxseg_50samseg.jsonl', cloud_save_path='/tmp/haozhezhao/checkpoint', no_local_save=False, vq_model='VQ-16', vq_ckpt='/tmp/haozhezhao/model/llamagen_t2i/vq_ds16_t2i.pt', codebook_size=16384, codebook_embed_dim=8, gpt_model='GPT-XL', gpt_ckpt='/tmp/haozhezhao/MLLMG/MLLMG_ckpts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt', gpt_type='t2i', vocab_size=16384, cls_token_num=512, dropout_p=0.1, token_dropout_p=0.1, drop_path=0.0, no_compile=False, results_dir='checkpoint/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated', dataset='ti2i', image_size=512, downsample_size=16, num_classes=1000, epochs=2, lr=0.0003, weight_decay=0.05, beta1=0.9, beta2=0.95, max_grad_norm=1.0, global_batch_size=56, global_seed=0, num_workers=8, log_every=25, ckpt_every=2000, gradient_accumulation_steps=4, mixed_precision='bf16', val_data_path='/tmp/haozhezhao/MLLMG/jsonl_data/dreambench_plus_valid.jsonl', use_vision_tower=True, model_name_or_path='/tmp/haozhezhao/model/blip2-flan-t5-xl', image_place_holder='<image>', processor_path=None, do_eval=True, max_eval_samples=500, train_text_encoder=True, no_left_padding=False, cfg_scale=7.5, top_k=16384, temperature=0.9, top_p=1.0, eval_steps=2000, project_name='llamagen_ti2i', load_from_checkpoint='/tmp/haozhezhao/MLLMG/checkpoint/FIXed_3M_1epoch_step32000.pt', warmup=0.05, lr_decay_style='cosine', lr_decay_ratio=0.1, train_iters=500000, class_dropout_prob=0.1, with_image_only=False, image_only_rate=0.1, stage2=False, subject_driven=True, load_subject_embedding=None, reference_data_path='/tmp/haozhezhao/MLLMG/cc12m_reference_tunnel.jsonl', multimodal_encoder='llava', do_recovery=True, no_replace=False, resume=False, dreambench_eval=True, find_unused_parameters=True, load_visual_encoder=False, continue_stage1=False, replace_subject=False, train_all=True, save_total_limit=1, load_language_projection='/tmp/haozhezhao/MLLMG/llava-v1.5-flant5_fixed-pretrain/mm_projector.bin', mm_vision_tower='openai/clip-vit-large-patch14', load_fixed_llamagen=True, unfreeze_output=False, fix='gpt-empty-fix', rank=0, world_size=8, gpu=0, dist_url='env://', distributed=True, dist_backend='nccl')
|
3 |
+
[[34m2025-04-23 11:12:04[0m] Starting rank=0, seed=0, world_size=8.
|
4 |
+
[[34m2025-04-23 11:12:04[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
5 |
+
[[34m2025-04-23 11:13:13[0m] GPT Parameters: 2,310,680,832
|
6 |
+
[[34m2025-04-23 11:13:13[0m] num decayed parameter tensors: 356, with 2,007,303,168 parameters
|
7 |
+
[[34m2025-04-23 11:13:13[0m] num non-decayed parameter tensors: 124, with 197,888 parameters
|
8 |
+
[[34m2025-04-23 11:13:13[0m] using fused AdamW: True
|
9 |
+
[[34m2025-04-23 11:13:22[0m] Dataset contains 1,313,682 images
|
10 |
+
[[34m2025-04-23 11:13:22[0m] Train iters 46916 , warmup 2345.8, len of loader 23458
|
11 |
+
[[34m2025-04-23 11:13:38[0m] ### LOAD pretraining weights from checkpoint: /tmp/haozhezhao/MLLMG/MLLMG_ckpts/checkpoints/AfterI2I_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_empty_fix_train_all/0100000.pt
|
12 |
+
[[34m2025-04-23 11:13:38[0m] Initial state: steps=0, epochs=0
|
13 |
+
[[34m2025-04-23 11:13:38[0m] compiling the model... (may take several minutes)
|
14 |
+
[[34m2025-04-23 11:13:39[0m] freeze the vit
|
15 |
+
[[34m2025-04-23 11:13:39[0m] ***** total param is 2310680832 *****
|
16 |
+
[[34m2025-04-23 11:13:39[0m] ***** total trained param is 2007501056 *****
|
17 |
+
[[34m2025-04-23 11:13:40[0m] Training for 2 epochs...
|
18 |
+
[[34m2025-04-23 11:13:40[0m] Beginning epoch 0...
|
19 |
+
[[34m2025-04-23 11:18:40[0m] (step=0000025) Train Loss: 6.6005, Train Steps/Sec: 0.08
|
20 |
+
[[34m2025-04-23 11:19:29[0m] (step=0000050) Train Loss: 6.6556, Train Steps/Sec: 0.51
|
21 |
+
[[34m2025-04-23 11:21:08[0m] (step=0000075) Train Loss: 6.4599, Train Steps/Sec: 0.25
|
22 |
+
[[34m2025-04-23 11:22:11[0m] (step=0000100) Train Loss: 6.3558, Train Steps/Sec: 0.40
|
23 |
+
[[34m2025-04-23 11:22:33[0m] (step=0000125) Train Loss: 6.2557, Train Steps/Sec: 1.17
|
24 |
+
[[34m2025-04-23 11:23:23[0m] (step=0000150) Train Loss: 6.1054, Train Steps/Sec: 0.50
|
25 |
+
[[34m2025-04-23 11:24:13[0m] (step=0000175) Train Loss: 6.1218, Train Steps/Sec: 0.50
|
26 |
+
[[34m2025-04-23 11:24:35[0m] (step=0000200) Train Loss: 6.0449, Train Steps/Sec: 1.15
|
27 |
+
[[34m2025-04-23 11:24:56[0m] (step=0000225) Train Loss: 5.9306, Train Steps/Sec: 1.17
|
28 |
+
[[34m2025-04-23 11:25:46[0m] (step=0000250) Train Loss: 5.8833, Train Steps/Sec: 0.50
|
29 |
+
[[34m2025-04-23 11:27:04[0m] (step=0000275) Train Loss: 5.9763, Train Steps/Sec: 0.32
|
30 |
+
[[34m2025-04-23 11:27:25[0m] (step=0000300) Train Loss: 5.8122, Train Steps/Sec: 1.17
|
31 |
+
[[34m2025-04-23 11:27:47[0m] (step=0000325) Train Loss: 5.9543, Train Steps/Sec: 1.17
|
32 |
+
[[34m2025-04-23 11:28:08[0m] (step=0000350) Train Loss: 5.8445, Train Steps/Sec: 1.17
|
33 |
+
[[34m2025-04-23 11:28:29[0m] (step=0000375) Train Loss: 5.8658, Train Steps/Sec: 1.17
|
34 |
+
[[34m2025-04-23 11:29:20[0m] (step=0000400) Train Loss: 5.7741, Train Steps/Sec: 0.49
|
35 |
+
[[34m2025-04-23 11:29:41[0m] (step=0000425) Train Loss: 5.8472, Train Steps/Sec: 1.17
|
36 |
+
[[34m2025-04-23 11:30:03[0m] (step=0000450) Train Loss: 5.8283, Train Steps/Sec: 1.17
|
37 |
+
[[34m2025-04-23 11:30:25[0m] (step=0000475) Train Loss: 5.8059, Train Steps/Sec: 1.12
|
38 |
+
[[34m2025-04-23 11:30:46[0m] (step=0000500) Train Loss: 5.8193, Train Steps/Sec: 1.17
|
39 |
+
[[34m2025-04-23 11:31:08[0m] (step=0000525) Train Loss: 5.8235, Train Steps/Sec: 1.17
|
40 |
+
[[34m2025-04-23 11:31:29[0m] (step=0000550) Train Loss: 5.8375, Train Steps/Sec: 1.17
|
41 |
+
[[34m2025-04-23 11:31:50[0m] (step=0000575) Train Loss: 5.8427, Train Steps/Sec: 1.17
|
42 |
+
[[34m2025-04-23 11:32:12[0m] (step=0000600) Train Loss: 5.7903, Train Steps/Sec: 1.16
|
43 |
+
[[34m2025-04-23 11:32:33[0m] (step=0000625) Train Loss: 5.8660, Train Steps/Sec: 1.17
|
44 |
+
[[34m2025-04-23 11:32:55[0m] (step=0000650) Train Loss: 5.7774, Train Steps/Sec: 1.17
|
45 |
+
[[34m2025-04-23 11:33:16[0m] (step=0000675) Train Loss: 5.7929, Train Steps/Sec: 1.17
|
46 |
+
[[34m2025-04-23 11:33:37[0m] (step=0000700) Train Loss: 5.9227, Train Steps/Sec: 1.17
|
47 |
+
[[34m2025-04-23 11:33:59[0m] (step=0000725) Train Loss: 5.7613, Train Steps/Sec: 1.17
|
48 |
+
[[34m2025-04-23 11:34:21[0m] (step=0000750) Train Loss: 5.8464, Train Steps/Sec: 1.11
|
49 |
+
[[34m2025-04-23 11:34:42[0m] (step=0000775) Train Loss: 5.8326, Train Steps/Sec: 1.17
|
50 |
+
[[34m2025-04-23 11:35:05[0m] (step=0000800) Train Loss: 5.7977, Train Steps/Sec: 1.11
|
51 |
+
[[34m2025-04-23 11:35:26[0m] (step=0000825) Train Loss: 5.7656, Train Steps/Sec: 1.17
|
52 |
+
[[34m2025-04-23 11:35:48[0m] (step=0000850) Train Loss: 5.7243, Train Steps/Sec: 1.17
|
53 |
+
[[34m2025-04-23 11:36:11[0m] (step=0000875) Train Loss: 5.7829, Train Steps/Sec: 1.07
|
54 |
+
[[34m2025-04-23 11:36:34[0m] (step=0000900) Train Loss: 5.7715, Train Steps/Sec: 1.10
|
55 |
+
[[34m2025-04-23 11:36:55[0m] (step=0000925) Train Loss: 5.8266, Train Steps/Sec: 1.17
|
56 |
+
[[34m2025-04-23 11:37:16[0m] (step=0000950) Train Loss: 5.8739, Train Steps/Sec: 1.17
|
57 |
+
[[34m2025-04-23 11:37:37[0m] (step=0000975) Train Loss: 5.7752, Train Steps/Sec: 1.17
|
58 |
+
[[34m2025-04-23 11:37:59[0m] (step=0001000) Train Loss: 5.7676, Train Steps/Sec: 1.17
|
59 |
+
[[34m2025-04-23 11:38:22[0m] (step=0001025) Train Loss: 5.7233, Train Steps/Sec: 1.06
|
60 |
+
[[34m2025-04-23 11:38:44[0m] (step=0001050) Train Loss: 5.7606, Train Steps/Sec: 1.17
|
61 |
+
[[34m2025-04-23 11:39:05[0m] (step=0001075) Train Loss: 5.7211, Train Steps/Sec: 1.17
|
62 |
+
[[34m2025-04-23 11:39:26[0m] (step=0001100) Train Loss: 5.7764, Train Steps/Sec: 1.17
|
63 |
+
[[34m2025-04-23 11:39:48[0m] (step=0001125) Train Loss: 5.7317, Train Steps/Sec: 1.18
|
64 |
+
[[34m2025-04-23 11:40:10[0m] (step=0001150) Train Loss: 5.7573, Train Steps/Sec: 1.12
|
65 |
+
[[34m2025-04-23 11:40:31[0m] (step=0001175) Train Loss: 5.7894, Train Steps/Sec: 1.17
|
66 |
+
[[34m2025-04-23 11:40:53[0m] (step=0001200) Train Loss: 5.7181, Train Steps/Sec: 1.17
|
67 |
+
[[34m2025-04-23 11:41:14[0m] (step=0001225) Train Loss: 5.7548, Train Steps/Sec: 1.17
|
68 |
+
[[34m2025-04-23 11:41:35[0m] (step=0001250) Train Loss: 5.6894, Train Steps/Sec: 1.17
|
69 |
+
[[34m2025-04-23 11:41:57[0m] (step=0001275) Train Loss: 5.7133, Train Steps/Sec: 1.17
|
70 |
+
[[34m2025-04-23 11:42:18[0m] (step=0001300) Train Loss: 5.7372, Train Steps/Sec: 1.17
|
71 |
+
[[34m2025-04-23 11:42:39[0m] (step=0001325) Train Loss: 5.8133, Train Steps/Sec: 1.17
|
72 |
+
[[34m2025-04-23 11:43:01[0m] (step=0001350) Train Loss: 5.7414, Train Steps/Sec: 1.17
|
73 |
+
[[34m2025-04-23 11:43:22[0m] (step=0001375) Train Loss: 5.7914, Train Steps/Sec: 1.17
|
74 |
+
[[34m2025-04-23 11:43:44[0m] (step=0001400) Train Loss: 5.6661, Train Steps/Sec: 1.17
|
75 |
+
[[34m2025-04-23 11:44:05[0m] (step=0001425) Train Loss: 5.7186, Train Steps/Sec: 1.17
|
76 |
+
[[34m2025-04-23 11:44:26[0m] (step=0001450) Train Loss: 5.8405, Train Steps/Sec: 1.17
|
77 |
+
[[34m2025-04-23 11:44:48[0m] (step=0001475) Train Loss: 5.7429, Train Steps/Sec: 1.17
|
78 |
+
[[34m2025-04-23 11:45:09[0m] (step=0001500) Train Loss: 5.6897, Train Steps/Sec: 1.17
|
79 |
+
[[34m2025-04-23 11:45:30[0m] (step=0001525) Train Loss: 5.7404, Train Steps/Sec: 1.17
|
80 |
+
[[34m2025-04-23 11:45:53[0m] (step=0001550) Train Loss: 5.7304, Train Steps/Sec: 1.12
|
81 |
+
[[34m2025-04-23 11:46:14[0m] (step=0001575) Train Loss: 5.7393, Train Steps/Sec: 1.17
|
82 |
+
[[34m2025-04-23 11:46:35[0m] (step=0001600) Train Loss: 5.7214, Train Steps/Sec: 1.17
|
83 |
+
[[34m2025-04-23 11:46:58[0m] (step=0001625) Train Loss: 5.7278, Train Steps/Sec: 1.12
|
84 |
+
[[34m2025-04-23 11:47:21[0m] (step=0001650) Train Loss: 5.7655, Train Steps/Sec: 1.08
|
85 |
+
[[34m2025-04-23 11:47:42[0m] (step=0001675) Train Loss: 5.7132, Train Steps/Sec: 1.17
|
86 |
+
[[34m2025-04-23 11:48:05[0m] (step=0001700) Train Loss: 5.8445, Train Steps/Sec: 1.11
|
87 |
+
[[34m2025-04-23 11:48:26[0m] (step=0001725) Train Loss: 5.7540, Train Steps/Sec: 1.17
|
88 |
+
[[34m2025-04-23 11:48:48[0m] (step=0001750) Train Loss: 5.6806, Train Steps/Sec: 1.17
|
89 |
+
[[34m2025-04-23 11:49:10[0m] (step=0001775) Train Loss: 5.7114, Train Steps/Sec: 1.11
|
90 |
+
[[34m2025-04-23 11:49:32[0m] (step=0001800) Train Loss: 5.7751, Train Steps/Sec: 1.17
|
91 |
+
[[34m2025-04-23 11:49:53[0m] (step=0001825) Train Loss: 5.7199, Train Steps/Sec: 1.17
|
92 |
+
[[34m2025-04-23 11:50:16[0m] (step=0001850) Train Loss: 5.7680, Train Steps/Sec: 1.07
|
93 |
+
[[34m2025-04-23 11:50:38[0m] (step=0001875) Train Loss: 5.7145, Train Steps/Sec: 1.17
|
94 |
+
[[34m2025-04-23 11:50:59[0m] (step=0001900) Train Loss: 5.6735, Train Steps/Sec: 1.17
|
95 |
+
[[34m2025-04-23 11:51:20[0m] (step=0001925) Train Loss: 5.8258, Train Steps/Sec: 1.17
|
96 |
+
[[34m2025-04-23 11:51:42[0m] (step=0001950) Train Loss: 5.7326, Train Steps/Sec: 1.17
|
97 |
+
[[34m2025-04-23 11:52:03[0m] (step=0001975) Train Loss: 5.6651, Train Steps/Sec: 1.17
|
98 |
+
[[34m2025-04-23 11:52:25[0m] (step=0002000) Train Loss: 5.6799, Train Steps/Sec: 1.17
|
99 |
+
[[34m2025-04-23 11:52:25[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/0046000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d8a592e16377c249d4988c125dbe55d5d04d491fd305c8184ebb29e85d2eafc
|
3 |
+
size 17322479662
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_10000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_12000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_14000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_16000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_18000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_20000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_22000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|
CKPTS/Afteri2i_100kckpt_LLAVAT5_empty_Fixed_just_segment_pretrain_stage3_dreambench_recap_400k_t2i_400k_flux_200k_midjourney_150k_recovery_150k_3e4_epoch2_half_rotated/005-GPT-XL/checkpoints/eval_step_24000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
![]() |
Git LFS Details
|