Mirmix committed on
Commit
4ca6e56
·
verified ·
1 Parent(s): 291abc3

End of training

Browse files
Files changed (48) hide show
  1. README.md +39 -0
  2. checkpoint-1000/model.safetensors +3 -0
  3. checkpoint-1000/optimizer.bin +3 -0
  4. checkpoint-1000/random_states_0.pkl +3 -0
  5. checkpoint-1000/scheduler.bin +3 -0
  6. checkpoint-1500/model.safetensors +3 -0
  7. checkpoint-1500/optimizer.bin +3 -0
  8. checkpoint-1500/random_states_0.pkl +3 -0
  9. checkpoint-1500/scheduler.bin +3 -0
  10. checkpoint-2000/model.safetensors +3 -0
  11. checkpoint-2000/optimizer.bin +3 -0
  12. checkpoint-2000/random_states_0.pkl +3 -0
  13. checkpoint-2000/scheduler.bin +3 -0
  14. checkpoint-2500/model.safetensors +3 -0
  15. checkpoint-2500/optimizer.bin +3 -0
  16. checkpoint-2500/random_states_0.pkl +3 -0
  17. checkpoint-2500/scheduler.bin +3 -0
  18. checkpoint-3000/model.safetensors +3 -0
  19. checkpoint-3000/optimizer.bin +3 -0
  20. checkpoint-3000/random_states_0.pkl +3 -0
  21. checkpoint-3000/scheduler.bin +3 -0
  22. checkpoint-500/model.safetensors +3 -0
  23. checkpoint-500/optimizer.bin +3 -0
  24. checkpoint-500/random_states_0.pkl +3 -0
  25. checkpoint-500/scheduler.bin +3 -0
  26. feature_extractor/preprocessor_config.json +27 -0
  27. learned_embeds-steps-1000.safetensors +3 -0
  28. learned_embeds-steps-1500.safetensors +3 -0
  29. learned_embeds-steps-2000.safetensors +3 -0
  30. learned_embeds-steps-2500.safetensors +3 -0
  31. learned_embeds-steps-3000.safetensors +3 -0
  32. learned_embeds-steps-500.safetensors +3 -0
  33. learned_embeds.safetensors +3 -0
  34. model_index.json +38 -0
  35. safety_checker/config.json +46 -0
  36. safety_checker/model.safetensors +3 -0
  37. scheduler/scheduler_config.json +15 -0
  38. text_encoder/config.json +24 -0
  39. text_encoder/model.safetensors +3 -0
  40. tokenizer/added_tokens.json +42 -0
  41. tokenizer/merges.txt +0 -0
  42. tokenizer/special_tokens_map.json +24 -0
  43. tokenizer/tokenizer_config.json +351 -0
  44. tokenizer/vocab.json +0 -0
  45. unet/config.json +68 -0
  46. unet/diffusion_pytorch_model.safetensors +3 -0
  47. vae/config.json +38 -0
  48. vae/diffusion_pytorch_model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: stable-diffusion-v1-5/stable-diffusion-v1-5
3
+ library_name: diffusers
4
+ license: creativeml-openrail-m
5
+ inference: true
6
+ tags:
7
+ - stable-diffusion
8
+ - stable-diffusion-diffusers
9
+ - text-to-image
10
+ - diffusers
11
+ - textual_inversion
12
+ - diffusers-training
13
+ ---
14
+
15
+ <!-- This model card has been generated automatically according to the information the training script had access to. You
16
+ should probably proofread and complete it, then remove this comment. -->
17
+
18
+
19
+ # Textual inversion text2image fine-tuning - Mirmix/textual_inversion_scan24_full_40tokens
20
+ These are textual inversion adaptation weights for stable-diffusion-v1-5/stable-diffusion-v1-5. You can find some example images below.
21
+
22
+
23
+
24
+
25
+ ## Intended uses & limitations
26
+
27
+ #### How to use
28
+
29
+ ```python
30
+ # TODO: add an example code snippet for running this diffusion pipeline
31
+ ```
32
+
33
+ #### Limitations and bias
34
+
35
+ [TODO: provide examples of latent issues and potential remediations]
36
+
37
+ ## Training details
38
+
39
+ [TODO: describe the data used to train the model]
checkpoint-1000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89d4f9d57a15b63f0247f0f368d7a932a9c12a333d1261ed8b48553534ffc998
3
+ size 492388048
checkpoint-1000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d05297f475a17c507c45e1848b33a0e73840ab93853fbde40f713d5cf2f353ea
3
+ size 303810995
checkpoint-1000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d01c6f948e46f70b92e5f6798f4e5de10a49310c8165960583c1706feeabd6a1
3
+ size 14757
checkpoint-1000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0141b8816d005ab0155e12076591b358b17b434b820ffd19fcb751fd3577ab0
3
+ size 1401
checkpoint-1500/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a84f73ad091141fd1d1a2d46d52caee77cb0e15f11b418201075afff194b5708
3
+ size 492388048
checkpoint-1500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:690d9be179623462c0357901ef2e4783476fefbad442ea10b4b52eec1b429d2a
3
+ size 303810995
checkpoint-1500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9e40c0946e89bcac2042f25ed88283d708457cc85ab8e6ccfb8e606d8d99d5a
3
+ size 14821
checkpoint-1500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f6de1f1aad4955373863105fea43996909135ab11a05f69f664002caa7f655
3
+ size 1401
checkpoint-2000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:743b2c92cc3e4bf324143f3f4f6cfe5cfc3b649b2cf422ba9b79c18720ed0a49
3
+ size 492388048
checkpoint-2000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:813b00a494fdad93f71a88ddd1f329c2a3523b4f2e6219033f1d20ff2574ff9f
3
+ size 303810995
checkpoint-2000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b125e118cb2d0e666683296148257b5aa4ddc285a60fcfb85086c44631fe1bcb
3
+ size 14821
checkpoint-2000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db8705e68e3f5d10b2093eb04409445a51eaa0fa537855f68bbff49f7ba03b3f
3
+ size 1401
checkpoint-2500/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcead55571721cfbdaa3b74278f3a004d34e650d99914ceb2ce272f59fde23e8
3
+ size 492388048
checkpoint-2500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff73eacb58ca0329262a196e46c71690f2a4f447f997defe3e9131dc3c51d4fd
3
+ size 303810995
checkpoint-2500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a402eefc26a466e09b970cad0b1d0030dc4ea604a2f0e72bc7148d2b7ba7020
3
+ size 14821
checkpoint-2500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:328b872afc2dde919bcdc05a2f15ee9a6c2c722dc09e791a74e330c511dff2d7
3
+ size 1401
checkpoint-3000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09527ffaeae0d91cd349cd1d048cb9b483a6caaa4eaf9f9865d1f348d00da4e1
3
+ size 492388048
checkpoint-3000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae9e002f0d4d1d2c808d4f041b8cb4a47d954a3bb9706d282614e21c509571fe
3
+ size 303810995
checkpoint-3000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c97f033955c7b4097886ca26ee6a72d8ddd6f530d1e3817d79454570eca28f3
3
+ size 14821
checkpoint-3000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f598def469aca44a1bf0b4394561a0be098ee257cabc03a28986894010b3775
3
+ size 1401
checkpoint-500/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4787541f83b8304f6f60b1fe055ff36e7f464f49d2b446cf61ab1ed210064800
3
+ size 492388048
checkpoint-500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a95d8c1d129fc2ceb9604943b383107417b81c489c4bdfb5ed5134913724541
3
+ size 303810995
checkpoint-500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0d4159ab81268837d746cd19f1ce830948007d67edde471bd7997d10ea95ae6
3
+ size 14757
checkpoint-500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee04579db6cf5d822fbf73f3441ac1670faf4a79ec5c320d39b5a697e8102112
3
+ size 1401
feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 224
26
+ }
27
+ }
learned_embeds-steps-1000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:178ada9a8239f3f05cc252ca921ca4bd7ac15ff8b6014d3d2e2e07e72951c46f
3
+ size 123000
learned_embeds-steps-1500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c921a92258340e4b78642ccfa2939fc7dd3b071974422bf9eca34a571df23ae0
3
+ size 123000
learned_embeds-steps-2000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd4196a49c188d5d4daca70795c0ed1b3fea63cc35e36c07c2fe3485137cffc2
3
+ size 123000
learned_embeds-steps-2500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a7231309834e25d2c5a043ece7adf27301741bae94bbb4b7de371ab3037e9a2
3
+ size 123000
learned_embeds-steps-3000.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436dd58216cdf56e9d99a25c029ee08874c544765dd10d538fc63a480625f651
3
+ size 123000
learned_embeds-steps-500.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aa83d73773ee02f160b707e206f4d0fa7f86ff58cfa5127cf192143f3189f44
3
+ size 123000
learned_embeds.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436dd58216cdf56e9d99a25c029ee08874c544765dd10d538fc63a480625f651
3
+ size 123000
model_index.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusionPipeline",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "_name_or_path": "stable-diffusion-v1-5/stable-diffusion-v1-5",
5
+ "feature_extractor": [
6
+ "transformers",
7
+ "CLIPImageProcessor"
8
+ ],
9
+ "image_encoder": [
10
+ null,
11
+ null
12
+ ],
13
+ "requires_safety_checker": true,
14
+ "safety_checker": [
15
+ "stable_diffusion",
16
+ "StableDiffusionSafetyChecker"
17
+ ],
18
+ "scheduler": [
19
+ "diffusers",
20
+ "PNDMScheduler"
21
+ ],
22
+ "text_encoder": [
23
+ "transformers",
24
+ "CLIPTextModel"
25
+ ],
26
+ "tokenizer": [
27
+ "transformers",
28
+ "CLIPTokenizer"
29
+ ],
30
+ "unet": [
31
+ "diffusers",
32
+ "UNet2DConditionModel"
33
+ ],
34
+ "vae": [
35
+ "diffusers",
36
+ "AutoencoderKL"
37
+ ]
38
+ }
safety_checker/config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "StableDiffusionSafetyChecker"
4
+ ],
5
+ "initializer_factor": 1.0,
6
+ "logit_scale_init_value": 2.6592,
7
+ "model_type": "clip",
8
+ "projection_dim": 768,
9
+ "text_config": {
10
+ "attention_dropout": 0.0,
11
+ "dropout": 0.0,
12
+ "hidden_act": "quick_gelu",
13
+ "hidden_size": 768,
14
+ "initializer_factor": 1.0,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 3072,
17
+ "layer_norm_eps": 1e-05,
18
+ "max_position_embeddings": 77,
19
+ "model_type": "clip_text_model",
20
+ "num_attention_heads": 12,
21
+ "num_hidden_layers": 12,
22
+ "projection_dim": 512,
23
+ "torch_dtype": "float32",
24
+ "vocab_size": 49408
25
+ },
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.52.3",
28
+ "vision_config": {
29
+ "attention_dropout": 0.0,
30
+ "dropout": 0.0,
31
+ "hidden_act": "quick_gelu",
32
+ "hidden_size": 1024,
33
+ "image_size": 224,
34
+ "initializer_factor": 1.0,
35
+ "initializer_range": 0.02,
36
+ "intermediate_size": 4096,
37
+ "layer_norm_eps": 1e-05,
38
+ "model_type": "clip_vision_model",
39
+ "num_attention_heads": 16,
40
+ "num_channels": 3,
41
+ "num_hidden_layers": 24,
42
+ "patch_size": 14,
43
+ "projection_dim": 512,
44
+ "torch_dtype": "float32"
45
+ }
46
+ }
safety_checker/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb351a5ded815c3ff744968ad9c6b218d071b9d313d04f35e813b84b4c0ffde8
3
+ size 1215979664
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "PNDMScheduler",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "clip_sample": false,
8
+ "num_train_timesteps": 1000,
9
+ "prediction_type": "epsilon",
10
+ "set_alpha_to_one": false,
11
+ "skip_prk_steps": true,
12
+ "steps_offset": 1,
13
+ "timestep_spacing": "leading",
14
+ "trained_betas": null
15
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModel"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 768,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.52.3",
23
+ "vocab_size": 49448
24
+ }
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09527ffaeae0d91cd349cd1d048cb9b483a6caaa4eaf9f9865d1f348d00da4e1
3
+ size 492388048
tokenizer/added_tokens.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<scan24-building>": 49408,
3
+ "<scan24-building>_1": 49409,
4
+ "<scan24-building>_10": 49418,
5
+ "<scan24-building>_11": 49419,
6
+ "<scan24-building>_12": 49420,
7
+ "<scan24-building>_13": 49421,
8
+ "<scan24-building>_14": 49422,
9
+ "<scan24-building>_15": 49423,
10
+ "<scan24-building>_16": 49424,
11
+ "<scan24-building>_17": 49425,
12
+ "<scan24-building>_18": 49426,
13
+ "<scan24-building>_19": 49427,
14
+ "<scan24-building>_2": 49410,
15
+ "<scan24-building>_20": 49428,
16
+ "<scan24-building>_21": 49429,
17
+ "<scan24-building>_22": 49430,
18
+ "<scan24-building>_23": 49431,
19
+ "<scan24-building>_24": 49432,
20
+ "<scan24-building>_25": 49433,
21
+ "<scan24-building>_26": 49434,
22
+ "<scan24-building>_27": 49435,
23
+ "<scan24-building>_28": 49436,
24
+ "<scan24-building>_29": 49437,
25
+ "<scan24-building>_3": 49411,
26
+ "<scan24-building>_30": 49438,
27
+ "<scan24-building>_31": 49439,
28
+ "<scan24-building>_32": 49440,
29
+ "<scan24-building>_33": 49441,
30
+ "<scan24-building>_34": 49442,
31
+ "<scan24-building>_35": 49443,
32
+ "<scan24-building>_36": 49444,
33
+ "<scan24-building>_37": 49445,
34
+ "<scan24-building>_38": 49446,
35
+ "<scan24-building>_39": 49447,
36
+ "<scan24-building>_4": 49412,
37
+ "<scan24-building>_5": 49413,
38
+ "<scan24-building>_6": 49414,
39
+ "<scan24-building>_7": 49415,
40
+ "<scan24-building>_8": 49416,
41
+ "<scan24-building>_9": 49417
42
+ }
tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,351 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "49406": {
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49407": {
13
+ "content": "<|endoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "49408": {
21
+ "content": "<scan24-building>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": false
27
+ },
28
+ "49409": {
29
+ "content": "<scan24-building>_1",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": false
35
+ },
36
+ "49410": {
37
+ "content": "<scan24-building>_2",
38
+ "lstrip": false,
39
+ "normalized": true,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": false
43
+ },
44
+ "49411": {
45
+ "content": "<scan24-building>_3",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": false
51
+ },
52
+ "49412": {
53
+ "content": "<scan24-building>_4",
54
+ "lstrip": false,
55
+ "normalized": true,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": false
59
+ },
60
+ "49413": {
61
+ "content": "<scan24-building>_5",
62
+ "lstrip": false,
63
+ "normalized": true,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": false
67
+ },
68
+ "49414": {
69
+ "content": "<scan24-building>_6",
70
+ "lstrip": false,
71
+ "normalized": true,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": false
75
+ },
76
+ "49415": {
77
+ "content": "<scan24-building>_7",
78
+ "lstrip": false,
79
+ "normalized": true,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": false
83
+ },
84
+ "49416": {
85
+ "content": "<scan24-building>_8",
86
+ "lstrip": false,
87
+ "normalized": true,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": false
91
+ },
92
+ "49417": {
93
+ "content": "<scan24-building>_9",
94
+ "lstrip": false,
95
+ "normalized": true,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": false
99
+ },
100
+ "49418": {
101
+ "content": "<scan24-building>_10",
102
+ "lstrip": false,
103
+ "normalized": true,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": false
107
+ },
108
+ "49419": {
109
+ "content": "<scan24-building>_11",
110
+ "lstrip": false,
111
+ "normalized": true,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": false
115
+ },
116
+ "49420": {
117
+ "content": "<scan24-building>_12",
118
+ "lstrip": false,
119
+ "normalized": true,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": false
123
+ },
124
+ "49421": {
125
+ "content": "<scan24-building>_13",
126
+ "lstrip": false,
127
+ "normalized": true,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": false
131
+ },
132
+ "49422": {
133
+ "content": "<scan24-building>_14",
134
+ "lstrip": false,
135
+ "normalized": true,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": false
139
+ },
140
+ "49423": {
141
+ "content": "<scan24-building>_15",
142
+ "lstrip": false,
143
+ "normalized": true,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": false
147
+ },
148
+ "49424": {
149
+ "content": "<scan24-building>_16",
150
+ "lstrip": false,
151
+ "normalized": true,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": false
155
+ },
156
+ "49425": {
157
+ "content": "<scan24-building>_17",
158
+ "lstrip": false,
159
+ "normalized": true,
160
+ "rstrip": false,
161
+ "single_word": false,
162
+ "special": false
163
+ },
164
+ "49426": {
165
+ "content": "<scan24-building>_18",
166
+ "lstrip": false,
167
+ "normalized": true,
168
+ "rstrip": false,
169
+ "single_word": false,
170
+ "special": false
171
+ },
172
+ "49427": {
173
+ "content": "<scan24-building>_19",
174
+ "lstrip": false,
175
+ "normalized": true,
176
+ "rstrip": false,
177
+ "single_word": false,
178
+ "special": false
179
+ },
180
+ "49428": {
181
+ "content": "<scan24-building>_20",
182
+ "lstrip": false,
183
+ "normalized": true,
184
+ "rstrip": false,
185
+ "single_word": false,
186
+ "special": false
187
+ },
188
+ "49429": {
189
+ "content": "<scan24-building>_21",
190
+ "lstrip": false,
191
+ "normalized": true,
192
+ "rstrip": false,
193
+ "single_word": false,
194
+ "special": false
195
+ },
196
+ "49430": {
197
+ "content": "<scan24-building>_22",
198
+ "lstrip": false,
199
+ "normalized": true,
200
+ "rstrip": false,
201
+ "single_word": false,
202
+ "special": false
203
+ },
204
+ "49431": {
205
+ "content": "<scan24-building>_23",
206
+ "lstrip": false,
207
+ "normalized": true,
208
+ "rstrip": false,
209
+ "single_word": false,
210
+ "special": false
211
+ },
212
+ "49432": {
213
+ "content": "<scan24-building>_24",
214
+ "lstrip": false,
215
+ "normalized": true,
216
+ "rstrip": false,
217
+ "single_word": false,
218
+ "special": false
219
+ },
220
+ "49433": {
221
+ "content": "<scan24-building>_25",
222
+ "lstrip": false,
223
+ "normalized": true,
224
+ "rstrip": false,
225
+ "single_word": false,
226
+ "special": false
227
+ },
228
+ "49434": {
229
+ "content": "<scan24-building>_26",
230
+ "lstrip": false,
231
+ "normalized": true,
232
+ "rstrip": false,
233
+ "single_word": false,
234
+ "special": false
235
+ },
236
+ "49435": {
237
+ "content": "<scan24-building>_27",
238
+ "lstrip": false,
239
+ "normalized": true,
240
+ "rstrip": false,
241
+ "single_word": false,
242
+ "special": false
243
+ },
244
+ "49436": {
245
+ "content": "<scan24-building>_28",
246
+ "lstrip": false,
247
+ "normalized": true,
248
+ "rstrip": false,
249
+ "single_word": false,
250
+ "special": false
251
+ },
252
+ "49437": {
253
+ "content": "<scan24-building>_29",
254
+ "lstrip": false,
255
+ "normalized": true,
256
+ "rstrip": false,
257
+ "single_word": false,
258
+ "special": false
259
+ },
260
+ "49438": {
261
+ "content": "<scan24-building>_30",
262
+ "lstrip": false,
263
+ "normalized": true,
264
+ "rstrip": false,
265
+ "single_word": false,
266
+ "special": false
267
+ },
268
+ "49439": {
269
+ "content": "<scan24-building>_31",
270
+ "lstrip": false,
271
+ "normalized": true,
272
+ "rstrip": false,
273
+ "single_word": false,
274
+ "special": false
275
+ },
276
+ "49440": {
277
+ "content": "<scan24-building>_32",
278
+ "lstrip": false,
279
+ "normalized": true,
280
+ "rstrip": false,
281
+ "single_word": false,
282
+ "special": false
283
+ },
284
+ "49441": {
285
+ "content": "<scan24-building>_33",
286
+ "lstrip": false,
287
+ "normalized": true,
288
+ "rstrip": false,
289
+ "single_word": false,
290
+ "special": false
291
+ },
292
+ "49442": {
293
+ "content": "<scan24-building>_34",
294
+ "lstrip": false,
295
+ "normalized": true,
296
+ "rstrip": false,
297
+ "single_word": false,
298
+ "special": false
299
+ },
300
+ "49443": {
301
+ "content": "<scan24-building>_35",
302
+ "lstrip": false,
303
+ "normalized": true,
304
+ "rstrip": false,
305
+ "single_word": false,
306
+ "special": false
307
+ },
308
+ "49444": {
309
+ "content": "<scan24-building>_36",
310
+ "lstrip": false,
311
+ "normalized": true,
312
+ "rstrip": false,
313
+ "single_word": false,
314
+ "special": false
315
+ },
316
+ "49445": {
317
+ "content": "<scan24-building>_37",
318
+ "lstrip": false,
319
+ "normalized": true,
320
+ "rstrip": false,
321
+ "single_word": false,
322
+ "special": false
323
+ },
324
+ "49446": {
325
+ "content": "<scan24-building>_38",
326
+ "lstrip": false,
327
+ "normalized": true,
328
+ "rstrip": false,
329
+ "single_word": false,
330
+ "special": false
331
+ },
332
+ "49447": {
333
+ "content": "<scan24-building>_39",
334
+ "lstrip": false,
335
+ "normalized": true,
336
+ "rstrip": false,
337
+ "single_word": false,
338
+ "special": false
339
+ }
340
+ },
341
+ "bos_token": "<|startoftext|>",
342
+ "clean_up_tokenization_spaces": false,
343
+ "do_lower_case": true,
344
+ "eos_token": "<|endoftext|>",
345
+ "errors": "replace",
346
+ "extra_special_tokens": {},
347
+ "model_max_length": 77,
348
+ "pad_token": "<|endoftext|>",
349
+ "tokenizer_class": "CLIPTokenizer",
350
+ "unk_token": "<|endoftext|>"
351
+ }
tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
unet/config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "_name_or_path": "stable-diffusion-v1-5/stable-diffusion-v1-5",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 320,
13
+ 640,
14
+ 1280,
15
+ 1280
16
+ ],
17
+ "center_input_sample": false,
18
+ "class_embed_type": null,
19
+ "class_embeddings_concat": false,
20
+ "conv_in_kernel": 3,
21
+ "conv_out_kernel": 3,
22
+ "cross_attention_dim": 768,
23
+ "cross_attention_norm": null,
24
+ "down_block_types": [
25
+ "CrossAttnDownBlock2D",
26
+ "CrossAttnDownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "DownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dropout": 0.0,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 4,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
42
+ "norm_eps": 1e-05,
43
+ "norm_num_groups": 32,
44
+ "num_attention_heads": null,
45
+ "num_class_embeds": null,
46
+ "only_cross_attention": false,
47
+ "out_channels": 4,
48
+ "projection_class_embeddings_input_dim": null,
49
+ "resnet_out_scale_factor": 1.0,
50
+ "resnet_skip_time_act": false,
51
+ "resnet_time_scale_shift": "default",
52
+ "reverse_transformer_layers_per_block": null,
53
+ "sample_size": 64,
54
+ "time_cond_proj_dim": null,
55
+ "time_embedding_act_fn": null,
56
+ "time_embedding_dim": null,
57
+ "time_embedding_type": "positional",
58
+ "timestep_post_act": null,
59
+ "transformer_layers_per_block": 1,
60
+ "up_block_types": [
61
+ "UpBlock2D",
62
+ "CrossAttnUpBlock2D",
63
+ "CrossAttnUpBlock2D",
64
+ "CrossAttnUpBlock2D"
65
+ ],
66
+ "upcast_attention": false,
67
+ "use_linear_projection": false
68
+ }
unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d27cd69d4a0aa32105087a619f32a51bc087e133be93fe23da92f3c0bcc07d79
3
+ size 3438167536
vae/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "_name_or_path": "stable-diffusion-v1-5/stable-diffusion-v1-5",
5
+ "act_fn": "silu",
6
+ "block_out_channels": [
7
+ 128,
8
+ 256,
9
+ 512,
10
+ 512
11
+ ],
12
+ "down_block_types": [
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D",
16
+ "DownEncoderBlock2D"
17
+ ],
18
+ "force_upcast": true,
19
+ "in_channels": 3,
20
+ "latent_channels": 4,
21
+ "latents_mean": null,
22
+ "latents_std": null,
23
+ "layers_per_block": 2,
24
+ "mid_block_add_attention": true,
25
+ "norm_num_groups": 32,
26
+ "out_channels": 3,
27
+ "sample_size": 512,
28
+ "scaling_factor": 0.18215,
29
+ "shift_factor": null,
30
+ "up_block_types": [
31
+ "UpDecoderBlock2D",
32
+ "UpDecoderBlock2D",
33
+ "UpDecoderBlock2D",
34
+ "UpDecoderBlock2D"
35
+ ],
36
+ "use_post_quant_conv": true,
37
+ "use_quant_conv": true
38
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4d2b5932bb4151e54e694fd31ccf51fca908223c9485bd56cd0e1d83ad94c49
3
+ size 334643268