JacobYuan committed on
Commit
eb2a505
·
verified ·
1 Parent(s): 9b45d8c

Upload folder using huggingface_hub

Browse files
1B/stage-1-image/args.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "batch_size": 20,
3
+ "accum_iter": 1,
4
+ "epochs": 100,
5
+ "warmup_epochs": 0.0025,
6
+ "lr": 5e-05,
7
+ "min_lr": 5e-05,
8
+ "wd": 0.1,
9
+ "clip_grad": 4.0,
10
+ "init_from": "",
11
+ "data_config": "",
12
+ "cache_ann_on_disk": false,
13
+ "length_clustering": true,
14
+ "num_workers": 64,
15
+ "pin_mem": true,
16
+ "seed": 0,
17
+ "output_dir": "",
18
+ "save_interval": 1,
19
+ "save_iteration_interval": 3000,
20
+ "only_save_trainable": false,
21
+ "ckpt_max_keep": 20,
22
+ "auto_resume": true,
23
+ "resume_path": null,
24
+ "model_parallel_size": 1,
25
+ "data_parallel": "fsdp",
26
+ "precision": "bf16",
27
+ "grad_precision": "fp32",
28
+ "checkpointing": true,
29
+ "max_seq_len": 32768,
30
+ "mask_image_logits": false,
31
+ "dropout": 0.0,
32
+ "z_loss_weight": 0.0,
33
+ "model_size": "1B_MMRoPE",
34
+ "pretrain_task": [
35
+ "predict_video"
36
+ ],
37
+ "video_fps": [
38
+ 1
39
+ ],
40
+ "video_duration": [
41
+ 1
42
+ ],
43
+ "cfg_mode": [
44
+ "text_only"
45
+ ],
46
+ "masking_mode": [
47
+ "text_to_video"
48
+ ],
49
+ "text_to_video_prob": 0.5,
50
+ "eval_data_config": "",
51
+ "run_eval": true,
52
+ "eval_in_epoch": 200,
53
+ "eval_mode": [
54
+ "text_to_video"
55
+ ],
56
+ "data_video_fps": 1,
57
+ "data_video_frames": 1,
58
+ "MaskedAR": true,
59
+ "mask_schedule": "cosine",
60
+ "min_masking_rate": 0.7,
61
+ "mask_contiguous_region_prob": null,
62
+ "noise_type": "mask",
63
+ "predict_all_tokens": false,
64
+ "frame_closs_recorder": true,
65
+ "mask_type": "tube",
66
+ "train_loss": "CEChunked",
67
+ "decay_start_coef": 1.0,
68
+ "compute_ntp_loss": false,
69
+ "train_with_slim_lm_head": false,
70
+ "train_with_vis_tok": true,
71
+ "vis_tok_start": 65536,
72
+ "visual_tokenizer": "Cosmos-Tokenizer-DV4x8x8",
73
+ "vocab_size": 129536,
74
+ "joint_img_video": false,
75
+ "img_batch_size": 8,
76
+ "img_data_config": null,
77
+ "video_iter_per_img_iter": 4,
78
+ "no_resume_metric_logger": true,
79
+ "world_size": 32,
80
+ "rank": 0,
81
+ "gpu": 0,
82
+ "local_rank": 0,
83
+ "dist_url": "env://",
84
+ "distributed": true,
85
+ "dist_backend": "nccl"
86
+ }
1B/stage-1-image/config.json ADDED
The diff for this file is too large to render. See raw diff
 
1B/stage-1-image/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f22eee519cd70ee3ee7a09979b7dc19af9dedf47c0f2711d43c3591fd3b2548
3
+ size 3007483424