# Training configuration: a LoRA adapter ([adapter]) trained on a
# 'qwen_image' model ([model]). Root-level keys below must stay above the
# first table header so they remain in the root table.

# Paths.
output_dir = '/root/diffusion-pipe/output/goya_drawings_qwen'
dataset = '/root/diffusion-pipe/my_configs/dataset.toml'

# Training length and batching.
epochs = 1000
micro_batch_size_per_gpu = 4
pipeline_stages = 1
gradient_accumulation_steps = 1
gradient_clipping = 1

# Evaluation.
eval_every_n_epochs = 1
eval_before_first_step = true
eval_micro_batch_size_per_gpu = 1
eval_gradient_accumulation_steps = 1

# Saving and checkpointing.
# NOTE(review): both an epoch-based and a step-based save interval are set;
# confirm the trainer honors both rather than one taking precedence.
save_every_n_epochs = 500
save_every_n_steps = 250
checkpoint_every_n_minutes = 30

# Memory, partitioning, caching, and logging.
activation_checkpointing = 'unsloth'
partition_method = 'parameters'
save_dtype = 'bfloat16'
caching_batch_size = 8
steps_per_print = 1

[model]
type = 'qwen_image'
# NOTE(review): this path sits under a 'wan' directory although the model
# type is 'qwen_image' — confirm the location is intentional.
diffusers_path = '/root/diffusion-pipe/imagegen_models/wan/Qwen-Image'
dtype = 'bfloat16'
timestep_sample_method = 'logit_normal'

[adapter]
type = 'lora'
rank = 32
dtype = 'bfloat16'

[optimizer]
type = 'automagic'
weight_decay = 0.01