TheMindExpansionNetwork committed on
Commit
4ecefab
·
verified ·
1 Parent(s): 363193d

Upload folder using huggingface_hub

Browse files
Files changed (35) hide show
  1. .job_config.json +125 -0
  2. config.yaml +109 -0
  3. log.txt +0 -0
  4. mindexpander_qwen_v1.safetensors +3 -0
  5. mindexpander_qwen_v1_000002000.safetensors +3 -0
  6. mindexpander_qwen_v1_000002250.safetensors +3 -0
  7. mindexpander_qwen_v1_000002500.safetensors +3 -0
  8. mindexpander_qwen_v1_000002750.safetensors +3 -0
  9. optimizer.pt +3 -0
  10. samples/1756522561350__000000000_0.jpg +0 -0
  11. samples/1756522647874__000000000_1.jpg +0 -0
  12. samples/1756523778796__000000250_0.jpg +0 -0
  13. samples/1756523866738__000000250_1.jpg +0 -0
  14. samples/1756524984321__000000500_0.jpg +0 -0
  15. samples/1756525072177__000000500_1.jpg +0 -0
  16. samples/1756526196791__000000750_0.jpg +0 -0
  17. samples/1756526284802__000000750_1.jpg +0 -0
  18. samples/1756527402735__000001000_0.jpg +0 -0
  19. samples/1756527490909__000001000_1.jpg +0 -0
  20. samples/1756528617469__000001250_0.jpg +0 -0
  21. samples/1756528705180__000001250_1.jpg +0 -0
  22. samples/1756529830083__000001500_0.jpg +0 -0
  23. samples/1756529917895__000001500_1.jpg +0 -0
  24. samples/1756531039898__000001750_0.jpg +0 -0
  25. samples/1756531127847__000001750_1.jpg +0 -0
  26. samples/1756532257016__000002000_0.jpg +0 -0
  27. samples/1756532345158__000002000_1.jpg +0 -0
  28. samples/1756533465237__000002250_0.jpg +0 -0
  29. samples/1756533553459__000002250_1.jpg +0 -0
  30. samples/1756534673904__000002500_0.jpg +0 -0
  31. samples/1756534761520__000002500_1.jpg +0 -0
  32. samples/1756535885683__000002750_0.jpg +0 -0
  33. samples/1756535972823__000002750_1.jpg +0 -0
  34. samples/1756537061569__000003000_0.jpg +0 -0
  35. samples/1756537148854__000003000_1.jpg +0 -0
.job_config.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "job": "extension",
3
+ "config": {
4
+ "name": "mindexpander_qwen_v1",
5
+ "process": [
6
+ {
7
+ "type": "ui_trainer",
8
+ "training_folder": "/app/ai-toolkit/output",
9
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
10
+ "device": "cuda",
11
+ "trigger_word": null,
12
+ "performance_log_every": 10,
13
+ "network": {
14
+ "type": "lora",
15
+ "linear": 32,
16
+ "linear_alpha": 32,
17
+ "conv": 16,
18
+ "conv_alpha": 16,
19
+ "lokr_full_rank": true,
20
+ "lokr_factor": -1,
21
+ "network_kwargs": {
22
+ "ignore_if_contains": []
23
+ }
24
+ },
25
+ "save": {
26
+ "dtype": "bf16",
27
+ "save_every": 250,
28
+ "max_step_saves_to_keep": 4,
29
+ "save_format": "diffusers",
30
+ "push_to_hub": false
31
+ },
32
+ "datasets": [
33
+ {
34
+ "folder_path": "/app/ai-toolkit/datasets/mind",
35
+ "control_path": null,
36
+ "mask_path": null,
37
+ "mask_min_value": 0.1,
38
+ "default_caption": "",
39
+ "caption_ext": "txt",
40
+ "caption_dropout_rate": 0.05,
41
+ "cache_latents_to_disk": false,
42
+ "is_reg": false,
43
+ "network_weight": 1,
44
+ "resolution": [
45
+ 512,
46
+ 768,
47
+ 1024
48
+ ],
49
+ "controls": [],
50
+ "shrink_video_to_frames": true,
51
+ "num_frames": 1,
52
+ "do_i2v": true,
53
+ "flip_x": false,
54
+ "flip_y": false
55
+ }
56
+ ],
57
+ "train": {
58
+ "batch_size": 1,
59
+ "bypass_guidance_embedding": false,
60
+ "steps": 3000,
61
+ "gradient_accumulation": 1,
62
+ "train_unet": true,
63
+ "train_text_encoder": false,
64
+ "gradient_checkpointing": true,
65
+ "noise_scheduler": "flowmatch",
66
+ "optimizer": "adamw8bit",
67
+ "timestep_type": "weighted",
68
+ "content_or_style": "balanced",
69
+ "optimizer_params": {
70
+ "weight_decay": 0.0001
71
+ },
72
+ "unload_text_encoder": false,
73
+ "cache_text_embeddings": false,
74
+ "lr": 0.0001,
75
+ "ema_config": {
76
+ "use_ema": false,
77
+ "ema_decay": 0.99
78
+ },
79
+ "skip_first_sample": false,
80
+ "disable_sampling": false,
81
+ "dtype": "bf16",
82
+ "diff_output_preservation": false,
83
+ "diff_output_preservation_multiplier": 1,
84
+ "diff_output_preservation_class": "person",
85
+ "switch_boundary_every": 1
86
+ },
87
+ "model": {
88
+ "name_or_path": "Qwen/Qwen-Image",
89
+ "quantize": true,
90
+ "qtype": "qfloat8",
91
+ "quantize_te": true,
92
+ "qtype_te": "qfloat8",
93
+ "arch": "qwen_image",
94
+ "low_vram": true,
95
+ "model_kwargs": {}
96
+ },
97
+ "sample": {
98
+ "sampler": "flowmatch",
99
+ "sample_every": 250,
100
+ "width": 1024,
101
+ "height": 1024,
102
+ "samples": [
103
+ {
104
+ "prompt": "photorealistic portrait of a person wearing the m1nd3xpand3r mask (third-eye symbol, orange/blue markings) seated on a dim night metro; neon city lights streak outside the window at camera-left; shallow depth of field, 35mm lens, soft fluorescent flicker, window reflections; calm, moody, cinematic lighting; sharp focus, high detail, filmic color grade"
105
+ },
106
+ {
107
+ "prompt": "photorealistic close-up of a person wearing the m1nd3xpand3r mask in a narrow neon-lit alley at night; light rain with beads and drips on the mask; shallow depth of field, 50mm lens; slow cinematic vibe, cool neon rimlight with warm shop-sign fill; steam and puddle reflections; sharp focus, high detail, cinematic contrast"
108
+ }
109
+ ],
110
+ "neg": "",
111
+ "seed": 42,
112
+ "walk_seed": true,
113
+ "guidance_scale": 4,
114
+ "sample_steps": 25,
115
+ "num_frames": 1,
116
+ "fps": 1
117
+ }
118
+ }
119
+ ]
120
+ },
121
+ "meta": {
122
+ "name": "[name]",
123
+ "version": "1.0"
124
+ }
125
+ }
config.yaml ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ job: extension
2
+ config:
3
+ name: mindexpander_qwen_v1
4
+ process:
5
+ - type: ui_trainer
6
+ training_folder: /app/ai-toolkit/output
7
+ sqlite_db_path: /app/ai-toolkit/aitk_db.db
8
+ device: cuda
9
+ trigger_word: null
10
+ performance_log_every: 10
11
+ network:
12
+ type: lora
13
+ linear: 32
14
+ linear_alpha: 32
15
+ conv: 16
16
+ conv_alpha: 16
17
+ lokr_full_rank: true
18
+ lokr_factor: -1
19
+ network_kwargs:
20
+ ignore_if_contains: []
21
+ save:
22
+ dtype: bf16
23
+ save_every: 250
24
+ max_step_saves_to_keep: 4
25
+ save_format: diffusers
26
+ push_to_hub: false
27
+ datasets:
28
+ - folder_path: /app/ai-toolkit/datasets/mind
29
+ control_path: null
30
+ mask_path: null
31
+ mask_min_value: 0.1
32
+ default_caption: ''
33
+ caption_ext: txt
34
+ caption_dropout_rate: 0.05
35
+ cache_latents_to_disk: false
36
+ is_reg: false
37
+ network_weight: 1
38
+ resolution:
39
+ - 512
40
+ - 768
41
+ - 1024
42
+ controls: []
43
+ shrink_video_to_frames: true
44
+ num_frames: 1
45
+ do_i2v: true
46
+ flip_x: false
47
+ flip_y: false
48
+ train:
49
+ batch_size: 1
50
+ bypass_guidance_embedding: false
51
+ steps: 3000
52
+ gradient_accumulation: 1
53
+ train_unet: true
54
+ train_text_encoder: false
55
+ gradient_checkpointing: true
56
+ noise_scheduler: flowmatch
57
+ optimizer: adamw8bit
58
+ timestep_type: weighted
59
+ content_or_style: balanced
60
+ optimizer_params:
61
+ weight_decay: 0.0001
62
+ unload_text_encoder: false
63
+ cache_text_embeddings: false
64
+ lr: 0.0001
65
+ ema_config:
66
+ use_ema: false
67
+ ema_decay: 0.99
68
+ skip_first_sample: false
69
+ disable_sampling: false
70
+ dtype: bf16
71
+ diff_output_preservation: false
72
+ diff_output_preservation_multiplier: 1
73
+ diff_output_preservation_class: person
74
+ switch_boundary_every: 1
75
+ model:
76
+ name_or_path: Qwen/Qwen-Image
77
+ quantize: true
78
+ qtype: qfloat8
79
+ quantize_te: true
80
+ qtype_te: qfloat8
81
+ arch: qwen_image
82
+ low_vram: true
83
+ model_kwargs: {}
84
+ sample:
85
+ sampler: flowmatch
86
+ sample_every: 250
87
+ width: 1024
88
+ height: 1024
89
+ samples:
90
+ - prompt: photorealistic portrait of a person wearing the m1nd3xpand3r mask
91
+ (third-eye symbol, orange/blue markings) seated on a dim night metro; neon
92
+ city lights streak outside the window at camera-left; shallow depth of field,
93
+ 35mm lens, soft fluorescent flicker, window reflections; calm, moody, cinematic
94
+ lighting; sharp focus, high detail, filmic color grade
95
+ - prompt: photorealistic close-up of a person wearing the m1nd3xpand3r mask
96
+ in a narrow neon-lit alley at night; light rain with beads and drips on
97
+ the mask; shallow depth of field, 50mm lens; slow cinematic vibe, cool neon
98
+ rimlight with warm shop-sign fill; steam and puddle reflections; sharp focus,
99
+ high detail, cinematic contrast
100
+ neg: ''
101
+ seed: 42
102
+ walk_seed: true
103
+ guidance_scale: 4
104
+ sample_steps: 25
105
+ num_frames: 1
106
+ fps: 1
107
+ meta:
108
+ name: mindexpander_qwen_v1
109
+ version: '1.0'
log.txt ADDED
The diff for this file is too large to render. See raw diff
 
mindexpander_qwen_v1.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4229098347ae62a92cbffdea8d06250891efd2e1b89b544412ba9b4dca7afe3
3
+ size 590058840
mindexpander_qwen_v1_000002000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8414dbc143c30e75c144afab0d98f60a8f2e3c1dc9d7a96b1bf40955b9919047
3
+ size 590058840
mindexpander_qwen_v1_000002250.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36792ae9a4c976a00f89917a1a59e8270edece1947e78a89536543c0ade4745f
3
+ size 590058840
mindexpander_qwen_v1_000002500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2588ef9bfd9270a89dd1d75243e4737e59710b7658c0da7c93145a23cea1707c
3
+ size 590058840
mindexpander_qwen_v1_000002750.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d8b3a5075723ea52dfd1823cc527a647892a5c1ce0b55766e45284ba3bc85d7
3
+ size 590058840
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f615183e2a2f3b5b4c357361b40663cba51867ba2793b1d3611c79b8ff321bd8
3
+ size 598613389
samples/1756522561350__000000000_0.jpg ADDED
samples/1756522647874__000000000_1.jpg ADDED
samples/1756523778796__000000250_0.jpg ADDED
samples/1756523866738__000000250_1.jpg ADDED
samples/1756524984321__000000500_0.jpg ADDED
samples/1756525072177__000000500_1.jpg ADDED
samples/1756526196791__000000750_0.jpg ADDED
samples/1756526284802__000000750_1.jpg ADDED
samples/1756527402735__000001000_0.jpg ADDED
samples/1756527490909__000001000_1.jpg ADDED
samples/1756528617469__000001250_0.jpg ADDED
samples/1756528705180__000001250_1.jpg ADDED
samples/1756529830083__000001500_0.jpg ADDED
samples/1756529917895__000001500_1.jpg ADDED
samples/1756531039898__000001750_0.jpg ADDED
samples/1756531127847__000001750_1.jpg ADDED
samples/1756532257016__000002000_0.jpg ADDED
samples/1756532345158__000002000_1.jpg ADDED
samples/1756533465237__000002250_0.jpg ADDED
samples/1756533553459__000002250_1.jpg ADDED
samples/1756534673904__000002500_0.jpg ADDED
samples/1756534761520__000002500_1.jpg ADDED
samples/1756535885683__000002750_0.jpg ADDED
samples/1756535972823__000002750_1.jpg ADDED
samples/1756537061569__000003000_0.jpg ADDED
samples/1756537148854__000003000_1.jpg ADDED