Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- checkpoint-189000/config.json +79 -0
- checkpoint-189000/generation_config.json +6 -0
- checkpoint-189000/model.safetensors +3 -0
- checkpoint-189000/optimizer.pt +3 -0
- checkpoint-189000/rng_state_0.pth +3 -0
- checkpoint-189000/rng_state_1.pth +3 -0
- checkpoint-189000/rng_state_10.pth +3 -0
- checkpoint-189000/rng_state_11.pth +3 -0
- checkpoint-189000/rng_state_12.pth +3 -0
- checkpoint-189000/rng_state_13.pth +3 -0
- checkpoint-189000/rng_state_14.pth +3 -0
- checkpoint-189000/rng_state_15.pth +3 -0
- checkpoint-189000/rng_state_2.pth +3 -0
- checkpoint-189000/rng_state_3.pth +3 -0
- checkpoint-189000/rng_state_4.pth +3 -0
- checkpoint-189000/rng_state_5.pth +3 -0
- checkpoint-189000/rng_state_6.pth +3 -0
- checkpoint-189000/rng_state_7.pth +3 -0
- checkpoint-189000/rng_state_8.pth +3 -0
- checkpoint-189000/rng_state_9.pth +3 -0
- checkpoint-189000/scheduler.pt +3 -0
- checkpoint-189000/trainer_state.json +3 -0
- checkpoint-189000/training_args.bin +3 -0
- checkpoint-190000/config.json +79 -0
- checkpoint-190000/generation_config.json +6 -0
- checkpoint-190000/model.safetensors +3 -0
- checkpoint-190000/optimizer.pt +3 -0
- checkpoint-190000/rng_state_0.pth +3 -0
- checkpoint-190000/rng_state_1.pth +3 -0
- checkpoint-190000/rng_state_10.pth +3 -0
- checkpoint-190000/rng_state_11.pth +3 -0
- checkpoint-190000/rng_state_12.pth +3 -0
- checkpoint-190000/rng_state_13.pth +3 -0
- checkpoint-190000/rng_state_14.pth +3 -0
- checkpoint-190000/rng_state_15.pth +3 -0
- checkpoint-190000/rng_state_2.pth +3 -0
- checkpoint-190000/rng_state_3.pth +3 -0
- checkpoint-190000/rng_state_4.pth +3 -0
- checkpoint-190000/rng_state_5.pth +3 -0
- checkpoint-190000/rng_state_6.pth +3 -0
- checkpoint-190000/rng_state_7.pth +3 -0
- checkpoint-190000/rng_state_8.pth +3 -0
- checkpoint-190000/rng_state_9.pth +3 -0
- checkpoint-190000/scheduler.pt +3 -0
- checkpoint-190000/trainer_state.json +3 -0
- checkpoint-190000/training_args.bin +3 -0
    	
        .gitattributes
    CHANGED
    
    | @@ -75,3 +75,5 @@ checkpoint-177000/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| 75 | 
             
            checkpoint-178000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 76 | 
             
            checkpoint-179000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 77 | 
             
            checkpoint-180000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
|  | |
|  | 
|  | |
| 75 | 
             
            checkpoint-178000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 76 | 
             
            checkpoint-179000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 77 | 
             
            checkpoint-180000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 78 | 
            +
            checkpoint-189000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
| 79 | 
            +
            checkpoint-190000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
         | 
    	
        checkpoint-189000/config.json
    ADDED
    
    | @@ -0,0 +1,79 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "ar_steps": 1,
         | 
| 3 | 
            +
              "architectures": [
         | 
| 4 | 
            +
                "DiffVLMBaseline"
         | 
| 5 | 
            +
              ],
         | 
| 6 | 
            +
              "attention_dropout": 0.0,
         | 
| 7 | 
            +
              "bos_token_id": 151643,
         | 
| 8 | 
            +
              "condition_layer": -1,
         | 
| 9 | 
            +
              "eos_token_id": 151645,
         | 
| 10 | 
            +
              "hidden_act": "silu",
         | 
| 11 | 
            +
              "hidden_size": 1536,
         | 
| 12 | 
            +
              "image_token_id": 151655,
         | 
| 13 | 
            +
              "img_cross_attention_dim": 2048,
         | 
| 14 | 
            +
              "img_diffuser_depth": 2,
         | 
| 15 | 
            +
              "img_ffn_dim_multiplier": null,
         | 
| 16 | 
            +
              "img_hidden_size": 1536,
         | 
| 17 | 
            +
              "img_multiple_of": 256,
         | 
| 18 | 
            +
              "img_norm_eps": 1e-05,
         | 
| 19 | 
            +
              "img_num_attention_heads": 12,
         | 
| 20 | 
            +
              "img_num_kv_heads": 12,
         | 
| 21 | 
            +
              "img_qk_norm": true,
         | 
| 22 | 
            +
              "in_channels": 32,
         | 
| 23 | 
            +
              "initializer_range": 0.02,
         | 
| 24 | 
            +
              "inject_img_diffuser": false,
         | 
| 25 | 
            +
              "input_size": 32,
         | 
| 26 | 
            +
              "intermediate_size": 8960,
         | 
| 27 | 
            +
              "layer_group_size": 7,
         | 
| 28 | 
            +
              "layerwise_start_idx": 0,
         | 
| 29 | 
            +
              "lora_alpha": 128,
         | 
| 30 | 
            +
              "lora_bias": "none",
         | 
| 31 | 
            +
              "lora_dropout": 0.05,
         | 
| 32 | 
            +
              "lora_enable": false,
         | 
| 33 | 
            +
              "lora_r": 64,
         | 
| 34 | 
            +
              "max_position_embeddings": 32768,
         | 
| 35 | 
            +
              "max_window_layers": 28,
         | 
| 36 | 
            +
              "model_type": "qwen2_vl",
         | 
| 37 | 
            +
              "non_linearity": 1,
         | 
| 38 | 
            +
              "norm_elementwise_affine": true,
         | 
| 39 | 
            +
              "num_attention_heads": 12,
         | 
| 40 | 
            +
              "num_hidden_layers": 28,
         | 
| 41 | 
            +
              "num_key_value_heads": 2,
         | 
| 42 | 
            +
              "patch_size": 1,
         | 
| 43 | 
            +
              "repa_coeff": 0.1,
         | 
| 44 | 
            +
              "repa_layers": "2",
         | 
| 45 | 
            +
              "repa_shared": false,
         | 
| 46 | 
            +
              "rms_norm_eps": 1e-06,
         | 
| 47 | 
            +
              "rope_scaling": {
         | 
| 48 | 
            +
                "mrope_section": [
         | 
| 49 | 
            +
                  16,
         | 
| 50 | 
            +
                  24,
         | 
| 51 | 
            +
                  24
         | 
| 52 | 
            +
                ],
         | 
| 53 | 
            +
                "rope_type": "default",
         | 
| 54 | 
            +
                "type": "default"
         | 
| 55 | 
            +
              },
         | 
| 56 | 
            +
              "rope_theta": 1000000.0,
         | 
| 57 | 
            +
              "sample_size": 128,
         | 
| 58 | 
            +
              "sampling_steps": 28,
         | 
| 59 | 
            +
              "sliding_window": null,
         | 
| 60 | 
            +
              "tie_word_embeddings": true,
         | 
| 61 | 
            +
              "torch_dtype": "bfloat16",
         | 
| 62 | 
            +
              "transformers_version": "4.47.0",
         | 
| 63 | 
            +
              "use_cache": true,
         | 
| 64 | 
            +
              "use_repa": false,
         | 
| 65 | 
            +
              "use_residual_attn": false,
         | 
| 66 | 
            +
              "use_sliding_window": false,
         | 
| 67 | 
            +
              "vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
         | 
| 68 | 
            +
              "video_token_id": 151656,
         | 
| 69 | 
            +
              "vision_config": {
         | 
| 70 | 
            +
                "hidden_size": 1536,
         | 
| 71 | 
            +
                "in_chans": 3,
         | 
| 72 | 
            +
                "model_type": "qwen2_vl",
         | 
| 73 | 
            +
                "spatial_patch_size": 14
         | 
| 74 | 
            +
              },
         | 
| 75 | 
            +
              "vision_end_token_id": 151653,
         | 
| 76 | 
            +
              "vision_start_token_id": 151652,
         | 
| 77 | 
            +
              "vision_token_id": 151654,
         | 
| 78 | 
            +
              "vocab_size": 151936
         | 
| 79 | 
            +
            }
         | 
    	
        checkpoint-189000/generation_config.json
    ADDED
    
    | @@ -0,0 +1,6 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "_from_model_config": true,
         | 
| 3 | 
            +
              "bos_token_id": 151643,
         | 
| 4 | 
            +
              "eos_token_id": 151645,
         | 
| 5 | 
            +
              "transformers_version": "4.47.0"
         | 
| 6 | 
            +
            }
         | 
    	
        checkpoint-189000/model.safetensors
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:9f7110617fe408558a4d0b9a7fd47029b59155ce76a0b5cf8e3c99e640844a32
         | 
| 3 | 
            +
            size 4410723984
         | 
    	
        checkpoint-189000/optimizer.pt
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:9776474c4cde597885b28089551f00ce828308256194dc27c80b2e9e1ffad093
         | 
| 3 | 
            +
            size 6330255386
         | 
    	
        checkpoint-189000/rng_state_0.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:a23858ca64abcfa32b4d153270f98b1534e7587e557068c586e15979f4d471c4
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_1.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:102accde21f8ea2d7f303ebd85012f9d75c0e7276a595e23250e95414ea9d602
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_10.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:fda946800a4d9ae10c19e34225352d36309c23004191c99595bc5ab3784dbe27
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_11.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:8cfa4d339029c936a454271d5e4f728549561c7a1fd7c593d17709bf86bc1347
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_12.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:06d4239cdaeeccff0ff625ae1cd1b85fd7ec64a78fec72c1ebe09d5dbe2b3516
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_13.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:f318d479b839b110d1b290f2a261e047e2b27cd8e4de4c8012b2f57ee52e0a6f
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_14.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:b5c6dbe081ccc4328e216cd1debaa627e7099b241e3d11695a977954f7d3111e
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_15.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:f02ef0fc1084871015d0118f18863f19e1b37f4571feb7292d638388282c039b
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-189000/rng_state_2.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:990682ec08971859d3d70d31c1016ceccbaef04af7dc1f488c3aef047d58d72a
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_3.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6d9801e03f8547f118003d580af322fb553e21137c527a65b28807dc5d817439
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_4.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:8dc3d12bbc3ed882452b614a5053fe8098578e8dbb578fa25abe0d8cc5df42ac
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_5.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:faf86e435dd212e2d663bb10da5fed15e62a4b6fc6919e2f747823571ac6fe89
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_6.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:462071a04663bcc22db73f31cb84724d622c642a7fdf9b0053657fe124401012
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_7.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:5e1d11976e0f263531458c70dab4f4eb4e46730dccf58e69869eafa7012efef7
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_8.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:1fb496c387835f1cc8ca7154355b382b4a88107a364c74afba6e90f7d5291c73
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/rng_state_9.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:50ce7bc5cb42ae442f859c132a529f66d7ebea54c60ff72ecce40b311e209503
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-189000/scheduler.pt
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:81e40a233853d8f6b340ec187d9e25189af2a0fe3577bd26db1bd6a183253e91
         | 
| 3 | 
            +
            size 1064
         | 
    	
        checkpoint-189000/trainer_state.json
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:cbeddd823dac44846ac5c0fc7fcdcaf39f574fdc56eee3b4f7d122e37e4601e2
         | 
| 3 | 
            +
            size 28887734
         | 
    	
        checkpoint-189000/training_args.bin
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:140f442153cd686154b89333de70cc4a79cc2a18c8bdfdd020d6bb8e06e5d10a
         | 
| 3 | 
            +
            size 5944
         | 
    	
        checkpoint-190000/config.json
    ADDED
    
    | @@ -0,0 +1,79 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "ar_steps": 1,
         | 
| 3 | 
            +
              "architectures": [
         | 
| 4 | 
            +
                "DiffVLMBaseline"
         | 
| 5 | 
            +
              ],
         | 
| 6 | 
            +
              "attention_dropout": 0.0,
         | 
| 7 | 
            +
              "bos_token_id": 151643,
         | 
| 8 | 
            +
              "condition_layer": -1,
         | 
| 9 | 
            +
              "eos_token_id": 151645,
         | 
| 10 | 
            +
              "hidden_act": "silu",
         | 
| 11 | 
            +
              "hidden_size": 1536,
         | 
| 12 | 
            +
              "image_token_id": 151655,
         | 
| 13 | 
            +
              "img_cross_attention_dim": 2048,
         | 
| 14 | 
            +
              "img_diffuser_depth": 2,
         | 
| 15 | 
            +
              "img_ffn_dim_multiplier": null,
         | 
| 16 | 
            +
              "img_hidden_size": 1536,
         | 
| 17 | 
            +
              "img_multiple_of": 256,
         | 
| 18 | 
            +
              "img_norm_eps": 1e-05,
         | 
| 19 | 
            +
              "img_num_attention_heads": 12,
         | 
| 20 | 
            +
              "img_num_kv_heads": 12,
         | 
| 21 | 
            +
              "img_qk_norm": true,
         | 
| 22 | 
            +
              "in_channels": 32,
         | 
| 23 | 
            +
              "initializer_range": 0.02,
         | 
| 24 | 
            +
              "inject_img_diffuser": false,
         | 
| 25 | 
            +
              "input_size": 32,
         | 
| 26 | 
            +
              "intermediate_size": 8960,
         | 
| 27 | 
            +
              "layer_group_size": 7,
         | 
| 28 | 
            +
              "layerwise_start_idx": 0,
         | 
| 29 | 
            +
              "lora_alpha": 128,
         | 
| 30 | 
            +
              "lora_bias": "none",
         | 
| 31 | 
            +
              "lora_dropout": 0.05,
         | 
| 32 | 
            +
              "lora_enable": false,
         | 
| 33 | 
            +
              "lora_r": 64,
         | 
| 34 | 
            +
              "max_position_embeddings": 32768,
         | 
| 35 | 
            +
              "max_window_layers": 28,
         | 
| 36 | 
            +
              "model_type": "qwen2_vl",
         | 
| 37 | 
            +
              "non_linearity": 1,
         | 
| 38 | 
            +
              "norm_elementwise_affine": true,
         | 
| 39 | 
            +
              "num_attention_heads": 12,
         | 
| 40 | 
            +
              "num_hidden_layers": 28,
         | 
| 41 | 
            +
              "num_key_value_heads": 2,
         | 
| 42 | 
            +
              "patch_size": 1,
         | 
| 43 | 
            +
              "repa_coeff": 0.1,
         | 
| 44 | 
            +
              "repa_layers": "2",
         | 
| 45 | 
            +
              "repa_shared": false,
         | 
| 46 | 
            +
              "rms_norm_eps": 1e-06,
         | 
| 47 | 
            +
              "rope_scaling": {
         | 
| 48 | 
            +
                "mrope_section": [
         | 
| 49 | 
            +
                  16,
         | 
| 50 | 
            +
                  24,
         | 
| 51 | 
            +
                  24
         | 
| 52 | 
            +
                ],
         | 
| 53 | 
            +
                "rope_type": "default",
         | 
| 54 | 
            +
                "type": "default"
         | 
| 55 | 
            +
              },
         | 
| 56 | 
            +
              "rope_theta": 1000000.0,
         | 
| 57 | 
            +
              "sample_size": 128,
         | 
| 58 | 
            +
              "sampling_steps": 28,
         | 
| 59 | 
            +
              "sliding_window": null,
         | 
| 60 | 
            +
              "tie_word_embeddings": true,
         | 
| 61 | 
            +
              "torch_dtype": "bfloat16",
         | 
| 62 | 
            +
              "transformers_version": "4.47.0",
         | 
| 63 | 
            +
              "use_cache": true,
         | 
| 64 | 
            +
              "use_repa": false,
         | 
| 65 | 
            +
              "use_residual_attn": false,
         | 
| 66 | 
            +
              "use_sliding_window": false,
         | 
| 67 | 
            +
              "vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
         | 
| 68 | 
            +
              "video_token_id": 151656,
         | 
| 69 | 
            +
              "vision_config": {
         | 
| 70 | 
            +
                "hidden_size": 1536,
         | 
| 71 | 
            +
                "in_chans": 3,
         | 
| 72 | 
            +
                "model_type": "qwen2_vl",
         | 
| 73 | 
            +
                "spatial_patch_size": 14
         | 
| 74 | 
            +
              },
         | 
| 75 | 
            +
              "vision_end_token_id": 151653,
         | 
| 76 | 
            +
              "vision_start_token_id": 151652,
         | 
| 77 | 
            +
              "vision_token_id": 151654,
         | 
| 78 | 
            +
              "vocab_size": 151936
         | 
| 79 | 
            +
            }
         | 
    	
        checkpoint-190000/generation_config.json
    ADDED
    
    | @@ -0,0 +1,6 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "_from_model_config": true,
         | 
| 3 | 
            +
              "bos_token_id": 151643,
         | 
| 4 | 
            +
              "eos_token_id": 151645,
         | 
| 5 | 
            +
              "transformers_version": "4.47.0"
         | 
| 6 | 
            +
            }
         | 
    	
        checkpoint-190000/model.safetensors
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:8de753b5f2512f8b4d9faee5ed22e4c1e4e023439180cff94831dd75e4ee101d
         | 
| 3 | 
            +
            size 4410723984
         | 
    	
        checkpoint-190000/optimizer.pt
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:bf48b456b2f680635022e8b2a1dcee71fe8c09db56283e03caaa0882566fe3e0
         | 
| 3 | 
            +
            size 6330255386
         | 
    	
        checkpoint-190000/rng_state_0.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:86f7975d28c10fc73f0af41fdc7c63c5ccf3432edeb95766fd0417c2d2862fb8
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_1.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:455e92cac33d164c5e788d29e73d47784c855071435d3d36a3093a1b9d0173ad
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_10.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:64396667e7dfd7d655e294dcfa30dcd748fc1c12297506b95803959b515c5fad
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_11.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:660bbe31a08d4aee4068c7121d5d620a014158af0d2a4d1cc2663ec0421118f7
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_12.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:1d2595bf2f907c6c67d8c52f554c2ef87bd0652cda66e18e4f38e12f5542ad7d
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_13.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:58f7b0bd0335f75afbca91a9b6d671b88927d7aacdb60eb5f65bd73eb6d09d43
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_14.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:d7047a3879e576c371ea965ffe320f7260c38679ec4753bfbb2b8ebdccb48fe4
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_15.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:d9e93fea78c45d8bb98c690c39d3578217586709d42e5e0ca498a43b1a20ce46
         | 
| 3 | 
            +
            size 15997
         | 
    	
        checkpoint-190000/rng_state_2.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:d0fec5848c88a36189261d72b94bfcd80a656025ea1c64c4b03115cff56dd740
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_3.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:948ffe1ccf6675fe9d5bc1dd31677fd8896ab3f25b4d932c4b341f9c3e1e0e79
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_4.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:b58749a1852b16a0e04d937454f0a5f183cc90602b8e4d9a4594fa6fe6e98dce
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_5.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:a77b814a44a20a062a6f31194bcf0e185c70a2cd55e5d4d194c4ca077df1720b
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_6.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6ec5da545cddb1de90232ca90a11112c313b31288f84c702d35899f75609b674
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_7.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:9b949d18e93316156b9007e66b96b40cc175796d768b8a06bd86c199f2042a44
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_8.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:dbb2332c4e76b5a93498dc260d85c3b6faa53a6aae68e0e72470fe0a5d47176a
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/rng_state_9.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:ec017754057f32b35067f87060290bc9dbe8fa2413ea86810d5c31936d35e521
         | 
| 3 | 
            +
            size 15984
         | 
    	
        checkpoint-190000/scheduler.pt
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6a3b5e0ba89828bae7276df782eea1006e3c1e5268b406c80f0108fda9bb265c
         | 
| 3 | 
            +
            size 1064
         | 
    	
        checkpoint-190000/trainer_state.json
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:9be732963295a858a7121431bf0c2abdbe5e34486212c29f61620b0cc54e1368
         | 
| 3 | 
            +
            size 29041053
         | 
    	
        checkpoint-190000/training_args.bin
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6e0067077bf7e704155ba205ddefb13770496e7ace5ccb257e2abe4bb8a4e496
         | 
| 3 | 
            +
            size 5944
         |