{ "output_dir": "exps", "exp_name": "sit-xl-1-dinov2-b-enc8-repae-invae-0.5-1.5-400k", "logging_dir": "logs", "report_to": "wandb", "sampling_steps": 10000, "resume_step": 0, "continue_train_exp_dir": null, "wandb_history_path": null, "model": "SiT-XL/1", "num_classes": 1000, "encoder_depth": 8, "qk_norm": false, "fused_attn": true, "bn_momentum": 0.1, "compile": true, "data_dir": "data", "resolution": 256, "batch_size": 256, "allow_tf32": true, "mixed_precision": "fp16", "epochs": 1400, "max_train_steps": 400000, "checkpointing_steps": 50000, "gradient_accumulation_steps": 1, "learning_rate": 0.0001, "adam_beta1": 0.9, "adam_beta2": 0.999, "adam_weight_decay": 0.0, "adam_epsilon": 1e-08, "max_grad_norm": 1.0, "seed": 0, "num_workers": 4, "path_type": "linear", "prediction": "v", "cfg_prob": 0.1, "enc_type": "dinov2-vit-b", "proj_coeff": 0.5, "weighting": "uniform", "vae": "f16d32", "vae_ckpt": "pretrained/invae-f16d32/invae-f16d32.pt", "disc_pretrained_ckpt": "pretrained/invae-f16d32/invae-f16d32-discriminator-ckpt.pt", "loss_cfg_path": "configs/l1_lpips_kl_gan.yaml", "vae_learning_rate": 0.0001, "disc_learning_rate": 0.0001, "vae_align_proj_coeff": 1.5 }