---
# Job file describing a single `ui_trainer` process that trains a `lora`
# network on the `Qwen/Qwen-Image` model.
#
# NOTE(review): the nesting below was rebuilt from a flattened copy of this
# file (no indentation, stray ` |` at the end of every line). Keys and values
# are unchanged; the parent of each key follows the usual ai-toolkit job
# layout -- confirm against the consumer's schema before running.
job: extension

config:
  name: qwen_image_infinite_future_lora_v1
  process:
    - type: ui_trainer
      training_folder: /home/featurize/ai-toolkit/output
      sqlite_db_path: /home/featurize/ai-toolkit/aitk_db.db
      device: cuda
      trigger_word: null
      performance_log_every: 10

      # NOTE(review): lokr_* keys are present although type is `lora`;
      # presumably ignored for this network type -- confirm.
      network:
        type: lora
        linear: 16
        linear_alpha: 16
        conv: 16
        conv_alpha: 16
        lokr_full_rank: true
        lokr_factor: -1
        network_kwargs:
          ignore_if_contains: []

      save:
        dtype: bf16
        save_every: 250
        max_step_saves_to_keep: 4000
        save_format: diffusers
        push_to_hub: false

      # One dataset folder, bucketed at three resolutions.
      datasets:
        - folder_path: /home/featurize/ai-toolkit/datasets/mimi_AI_art_Infinite_future_landscape_images_captioned
          control_path: null
          mask_path: null
          mask_min_value: 0.1
          default_caption: ''
          caption_ext: txt
          caption_dropout_rate: 0.05
          cache_latents_to_disk: false
          is_reg: false
          network_weight: 1
          resolution:
            - 512
            - 768
            - 1024
          controls: []
          shrink_video_to_frames: true
          num_frames: 1
          do_i2v: true

      train:
        batch_size: 1
        bypass_guidance_embedding: false
        steps: 30000
        gradient_accumulation: 1
        train_unet: true
        train_text_encoder: false
        gradient_checkpointing: true
        noise_scheduler: flowmatch
        optimizer: adamw8bit
        timestep_type: weighted
        content_or_style: balanced
        optimizer_params:
          weight_decay: 0.0001
        unload_text_encoder: false
        cache_text_embeddings: true
        lr: 0.0001
        ema_config:
          use_ema: false
          ema_decay: 0.99
        skip_first_sample: false
        disable_sampling: false
        dtype: bf16
        diff_output_preservation: false
        diff_output_preservation_multiplier: 1
        diff_output_preservation_class: person

      model:
        name_or_path: Qwen/Qwen-Image
        quantize: true
        # The `|` inside this value is part of the string, so it is quoted.
        # NOTE(review): looks like `<quant type>|<adapter path>` -- confirm.
        qtype: 'uint3|ostris/accuracy_recovery_adapters/qwen_image_torchao_uint3.safetensors'
        quantize_te: true
        qtype_te: qfloat8
        arch: qwen_image
        low_vram: true
        model_kwargs: {}

      # Sampling settings: 512 wide by 1024 high, two prompts.
      sample:
        sampler: flowmatch
        sample_every: 250
        width: 512
        height: 1024
        samples:
          # Folded scalars: line breaks below become single spaces, so each
          # prompt is one line of text at load time.
          - prompt: >-
              In the style of Infinite future landscape , This is a digitally created,
              hyper-realistic CGI image depicting a fantastical aerial view of a sprawling
              cityscape. The image showcases a massive, ancient stone arch bridge stretching
              across the foreground, with intricate, gothic-style spires and towers along
              its edges. Below the bridge, a vast, turquoise ocean with visible coral
              reefs and islands can be seen. The city itself is densely packed with tall,
              dark buildings and spires, creating a labyrinthine effect. The background
              features a vibrant blue sky filled with fluffy white clouds, with the sun
              shining brightly in the top right corner, casting dramatic shadows. The
              overall color palette is dominated by rich blues and greens, with contrasting
              dark stone textures.
          - prompt: >-
              In the style of Infinite future landscape , Sunlight filters through
              clouds onto a cherry blossom-filled meadow, where a blue-haired youth in
              an indigo coat stands by a vermilion bridge, holding a book as petals drift
              past his smile. The scene blends dynamic nature with human stillness, using
              pink, red and blue hues to create harmony, while symbolic elements like
              blossoms and books add depth.
        neg: ''
        seed: 42
        walk_seed: true
        guidance_scale: 4
        sample_steps: 25
        num_frames: 1
        fps: 1

meta:
  name: qwen_image_infinite_future_lora_v1
  # Quoted so the version stays a string rather than the float 1.0.
  version: '1.0'