saddam213 committed on
Commit
4ab0607
·
verified ·
1 Parent(s): d46af0f

Initial Upload

Browse files
.gitattributes CHANGED
@@ -33,3 +33,10 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ controlnet/model.onnx.data filter=lfs diff=lfs merge=lfs -text
37
+ Icon.png filter=lfs diff=lfs merge=lfs -text
38
+ Sample.png filter=lfs diff=lfs merge=lfs -text
39
+ Sample2.png filter=lfs diff=lfs merge=lfs -text
40
+ Sample3.png filter=lfs diff=lfs merge=lfs -text
41
+ Sample4.png filter=lfs diff=lfs merge=lfs -text
42
+ unet/model.onnx.data filter=lfs diff=lfs merge=lfs -text
Icon.png ADDED

Git LFS Details

  • SHA256: cf3a14a1e970eb455b53a09217e49540c169ced2e7287f4a6261c6a51f6ca990
  • Pointer size: 132 Bytes
  • Size of remote file: 1.82 MB
README.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # iNiverse Mix XL v1.1 - Onnx Olive DirectML Optimized
2
+
3
+ ## Original Model
4
+ https://civitai.com/models/226533?modelVersionId=481914
5
+
6
+ ## C# Inference Demo
7
+ https://github.com/TensorStack-AI/OnnxStack
8
+
9
+ ```csharp
10
+ // Create Pipeline
11
+ var pipeline = StableDiffusionXLPipeline.CreatePipeline("D:\\Models\\iNiverseMix-XL-onnx");
12
+
13
+ // Prompt
14
+ var promptOptions = new PromptOptions
15
+ {
16
+ Prompt = "Illustrate a young woman reading a book in a library, surrounded by shelves filled with books"
17
+ };
18
+
19
+ // Run pipeline
20
+ var result = await pipeline.GenerateImageAsync(promptOptions);
21
+
22
+ // Save Image Result
23
+ await result.SaveAsync("Result.png");
24
+ ```
25
+ ## Inference Result
26
+ ![Intro Image](Sample.png)
Sample.png ADDED

Git LFS Details

  • SHA256: 2eebd67f821412163981dfd6b8f30a58845e6f3256128905a1ab783596e4c7b6
  • Pointer size: 132 Bytes
  • Size of remote file: 1.36 MB
Sample2.png ADDED

Git LFS Details

  • SHA256: 9200225fe2f2ac456ca8d59ee844b79983617d01b48fe1add0f58db06da7a2b7
  • Pointer size: 132 Bytes
  • Size of remote file: 1.91 MB
Sample3.png ADDED

Git LFS Details

  • SHA256: 0b7f77deb9ac0e9d0970d111ecee60593b4b84d712a528ef22436d8791b7105d
  • Pointer size: 132 Bytes
  • Size of remote file: 1.55 MB
Sample4.png ADDED

Git LFS Details

  • SHA256: e308cb2cd88aef3465f54ca8a6026f3407e66e2006070438f2de3e30806d9b5f
  • Pointer size: 132 Bytes
  • Size of remote file: 1.71 MB
controlnet/config.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "attention_type": "default",
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "center_input_sample": false,
20
+ "class_embed_type": null,
21
+ "class_embeddings_concat": false,
22
+ "conv_in_kernel": 3,
23
+ "conv_out_kernel": 3,
24
+ "cross_attention_dim": 2048,
25
+ "cross_attention_norm": null,
26
+ "down_block_types": [
27
+ "DownBlock2D",
28
+ "CrossAttnDownBlock2D",
29
+ "CrossAttnDownBlock2D"
30
+ ],
31
+ "downsample_padding": 1,
32
+ "dropout": 0.0,
33
+ "dual_cross_attention": false,
34
+ "encoder_hid_dim": null,
35
+ "encoder_hid_dim_type": null,
36
+ "flip_sin_to_cos": true,
37
+ "freq_shift": 0,
38
+ "in_channels": 4,
39
+ "layers_per_block": 2,
40
+ "mid_block_only_cross_attention": null,
41
+ "mid_block_scale_factor": 1,
42
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "out_channels": 4,
49
+ "projection_class_embeddings_input_dim": 2816,
50
+ "resnet_out_scale_factor": 1.0,
51
+ "resnet_skip_time_act": false,
52
+ "resnet_time_scale_shift": "default",
53
+ "reverse_transformer_layers_per_block": null,
54
+ "sample_size": 128,
55
+ "time_cond_proj_dim": null,
56
+ "time_embedding_act_fn": null,
57
+ "time_embedding_dim": null,
58
+ "time_embedding_type": "positional",
59
+ "timestep_post_act": null,
60
+ "transformer_layers_per_block": [
61
+ 1,
62
+ 2,
63
+ 10
64
+ ],
65
+ "up_block_types": [
66
+ "CrossAttnUpBlock2D",
67
+ "CrossAttnUpBlock2D",
68
+ "UpBlock2D"
69
+ ],
70
+ "upcast_attention": null,
71
+ "use_linear_projection": true
72
+ }
controlnet/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57135821c1f621398c1641b43f4bc6058c6da0b70c438a7b7f87c452910b6b5d
3
+ size 1244445
controlnet/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d363ee8e221f8cb43449dea18f60b058e1f23117f24acef32ffd5f6c2c504b4
3
+ size 5134903040
model_index.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusionXLPipeline",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "feature_extractor": [
5
+ null,
6
+ null
7
+ ],
8
+ "force_zeros_for_empty_prompt": true,
9
+ "image_encoder": [
10
+ null,
11
+ null
12
+ ],
13
+ "scheduler": [
14
+ "diffusers",
15
+ "EulerDiscreteScheduler"
16
+ ],
17
+ "text_encoder": [
18
+ "transformers",
19
+ "CLIPTextModel"
20
+ ],
21
+ "text_encoder_2": [
22
+ "transformers",
23
+ "CLIPTextModelWithProjection"
24
+ ],
25
+ "tokenizer": [
26
+ "transformers",
27
+ "CLIPTokenizer"
28
+ ],
29
+ "tokenizer_2": [
30
+ "transformers",
31
+ "CLIPTokenizer"
32
+ ],
33
+ "unet": [
34
+ "diffusers",
35
+ "UNet2DConditionModel"
36
+ ],
37
+ "vae": [
38
+ "diffusers",
39
+ "AutoencoderKL"
40
+ ]
41
+ }
model_template.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Id": "A70F7EE5-E99E-4108-84D0-1590EA308DB3",
3
+ "FileVersion": "1",
4
+ "Created": "2024-06-16T00:00:00",
5
+ "Name": "iNiverse Mix XL",
6
+ "ImageIcon": "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/Icon.png",
7
+ "Author": "JinnGames",
8
+ "Description": "This model delivers highly realistic renderings, optimized for capturing the diverse appearances of Asian characters. It excels in producing detailed and varied styles from different countries, highlighting intricate features. For optimal visual quality, recommended resolutions are 768, 1024, and 1280.",
9
+ "Rank": 310,
10
+ "Group": "Online",
11
+ "Template": "SDXL",
12
+ "Category": "StableDiffusion",
13
+ "StableDiffusionTemplate": {
14
+ "PipelineType": "StableDiffusionXL",
15
+ "ModelType": "Base",
16
+ "SampleSize": 1024,
17
+ "TokenizerLength": 768,
18
+ "DiffuserTypes": [
19
+ "TextToImage",
20
+ "ImageToImage",
21
+ "ImageInpaintLegacy"
22
+ ],
23
+ "SchedulerDefaults": {
24
+ "SchedulerType": "EulerAncestral",
25
+ "Steps": 30,
26
+ "StepsMin": 4,
27
+ "StepsMax": 100,
28
+ "Guidance": 4,
29
+ "GuidanceMin": 0,
30
+ "GuidanceMax": 30,
31
+ "TimestepSpacing": "Linspace",
32
+ "BetaSchedule": "ScaledLinear",
33
+ "BetaStart": 0.00085,
34
+ "BetaEnd": 0.012
35
+ }
36
+ },
37
+ "Precision": "F16",
38
+ "MemoryMin": 6,
39
+ "MemoryMax": 14,
40
+ "DownloadSize": 11.2,
41
+ "Website": "https://civitai.com/models/226533?modelVersionId=481914",
42
+ "Repository": "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx",
43
+ "RepositoryFiles": [
44
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/controlnet/model.onnx",
45
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/controlnet/model.onnx.data",
46
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/controlnet/config.json",
47
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/scheduler/scheduler_config.json",
48
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/text_encoder/model.onnx",
49
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/text_encoder/config.json",
50
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/text_encoder_2/model.onnx",
51
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/text_encoder_2/config.json",
52
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer/merges.txt",
53
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer/model.onnx",
54
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer/special_tokens_map.json",
55
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer/tokenizer_config.json",
56
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer/vocab.json",
57
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer_2/merges.txt",
58
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer_2/model.onnx",
59
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer_2/special_tokens_map.json",
60
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer_2/tokenizer_config.json",
61
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/tokenizer_2/vocab.json",
62
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/unet/model.onnx",
63
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/unet/model.onnx.data",
64
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/unet/config.json",
65
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/vae_decoder/model.onnx",
66
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/vae_decoder/config.json",
67
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/vae_encoder/model.onnx",
68
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/vae_encoder/config.json",
69
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/model_index.json",
70
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/model_template.json",
71
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/README.md"
72
+ ],
73
+ "PreviewImages": [
74
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/Sample.png",
75
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/Sample2.png",
76
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/Sample3.png",
77
+ "https://huggingface.co/TensorStack/iNiverseMix-XL-onnx/resolve/main/Sample4.png"
78
+ ],
79
+ "Tags": [
80
+ "GPU",
81
+ "F16"
82
+ ]
83
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "EulerDiscreteScheduler",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "clip_sample": false,
8
+ "final_sigmas_type": "zero",
9
+ "interpolation_type": "linear",
10
+ "num_train_timesteps": 1000,
11
+ "prediction_type": "epsilon",
12
+ "rescale_betas_zero_snr": false,
13
+ "sample_max_value": 1.0,
14
+ "set_alpha_to_one": false,
15
+ "sigma_max": null,
16
+ "sigma_min": null,
17
+ "skip_prk_steps": true,
18
+ "steps_offset": 1,
19
+ "timestep_spacing": "leading",
20
+ "timestep_type": "discrete",
21
+ "trained_betas": null,
22
+ "use_karras_sigmas": false
23
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModel"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 768,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float16",
22
+ "transformers_version": "4.41.2",
23
+ "vocab_size": 49408
24
+ }
text_encoder/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5d36b62db38bba1409973b6f88e9e34cf0a8bc22bb19cb9a5e58944d0f633ef
3
+ size 246481009
text_encoder_2/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModelWithProjection"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_size": 1280,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 5120,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 20,
18
+ "num_hidden_layers": 32,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 1280,
21
+ "torch_dtype": "float16",
22
+ "transformers_version": "4.41.2",
23
+ "vocab_size": 49408
24
+ }
text_encoder_2/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3b5254183fefc58b3a2c729f56eeafa1c1e2ac6faa00a939c0bc7fb4414d4bf
3
+ size 1390289338
tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b7618c80a5bd8d1ee6fe92b28e7b72dde7aaa522963ff083f284501a9ec7df
3
+ size 1683233
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "49406": {
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49407": {
13
+ "content": "<|endoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "bos_token": "<|startoftext|>",
22
+ "clean_up_tokenization_spaces": true,
23
+ "do_lower_case": true,
24
+ "eos_token": "<|endoftext|>",
25
+ "errors": "replace",
26
+ "model_max_length": 77,
27
+ "pad_token": "<|endoftext|>",
28
+ "tokenizer_class": "CLIPTokenizer",
29
+ "unk_token": "<|endoftext|>"
30
+ }
tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b7618c80a5bd8d1ee6fe92b28e7b72dde7aaa522963ff083f284501a9ec7df
3
+ size 1683233
tokenizer_2/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "!",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer_2/tokenizer_config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "!",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49406": {
13
+ "content": "<|startoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "49407": {
21
+ "content": "<|endoftext|>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "bos_token": "<|startoftext|>",
30
+ "clean_up_tokenization_spaces": true,
31
+ "do_lower_case": true,
32
+ "eos_token": "<|endoftext|>",
33
+ "errors": "replace",
34
+ "model_max_length": 77,
35
+ "pad_token": "!",
36
+ "tokenizer_class": "CLIPTokenizer",
37
+ "unk_token": "<|endoftext|>"
38
+ }
tokenizer_2/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
unet/config.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "attention_type": "default",
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "center_input_sample": false,
20
+ "class_embed_type": null,
21
+ "class_embeddings_concat": false,
22
+ "conv_in_kernel": 3,
23
+ "conv_out_kernel": 3,
24
+ "cross_attention_dim": 2048,
25
+ "cross_attention_norm": null,
26
+ "down_block_types": [
27
+ "DownBlock2D",
28
+ "CrossAttnDownBlock2D",
29
+ "CrossAttnDownBlock2D"
30
+ ],
31
+ "downsample_padding": 1,
32
+ "dropout": 0.0,
33
+ "dual_cross_attention": false,
34
+ "encoder_hid_dim": null,
35
+ "encoder_hid_dim_type": null,
36
+ "flip_sin_to_cos": true,
37
+ "freq_shift": 0,
38
+ "in_channels": 4,
39
+ "layers_per_block": 2,
40
+ "mid_block_only_cross_attention": null,
41
+ "mid_block_scale_factor": 1,
42
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "out_channels": 4,
49
+ "projection_class_embeddings_input_dim": 2816,
50
+ "resnet_out_scale_factor": 1.0,
51
+ "resnet_skip_time_act": false,
52
+ "resnet_time_scale_shift": "default",
53
+ "reverse_transformer_layers_per_block": null,
54
+ "sample_size": 128,
55
+ "time_cond_proj_dim": null,
56
+ "time_embedding_act_fn": null,
57
+ "time_embedding_dim": null,
58
+ "time_embedding_type": "positional",
59
+ "timestep_post_act": null,
60
+ "transformer_layers_per_block": [
61
+ 1,
62
+ 2,
63
+ 10
64
+ ],
65
+ "up_block_types": [
66
+ "CrossAttnUpBlock2D",
67
+ "CrossAttnUpBlock2D",
68
+ "UpBlock2D"
69
+ ],
70
+ "upcast_attention": null,
71
+ "use_linear_projection": true
72
+ }
unet/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6782f91b2c57891aaf2fd4146141fc86f63d8bf9bc25a86e5b91d422361d4b
3
+ size 1242150
unet/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d363ee8e221f8cb43449dea18f60b058e1f23117f24acef32ffd5f6c2c504b4
3
+ size 5134903040
vae_decoder/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.26.3",
4
+ "act_fn": "silu",
5
+ "block_out_channels": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 512
10
+ ],
11
+ "down_block_types": [
12
+ "DownEncoderBlock2D",
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D"
16
+ ],
17
+ "force_upcast": true,
18
+ "in_channels": 3,
19
+ "latent_channels": 4,
20
+ "layers_per_block": 2,
21
+ "norm_num_groups": 32,
22
+ "out_channels": 3,
23
+ "sample_size": 1024,
24
+ "scaling_factor": 0.13025,
25
+ "up_block_types": [
26
+ "UpDecoderBlock2D",
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D",
29
+ "UpDecoderBlock2D"
30
+ ]
31
+ }
vae_decoder/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97c3b5b7642de95f51650f3c59d202d1e80ad10c44252c21ab237ff020a2e8d8
3
+ size 99039207
vae_encoder/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.26.3",
4
+ "act_fn": "silu",
5
+ "block_out_channels": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 512
10
+ ],
11
+ "down_block_types": [
12
+ "DownEncoderBlock2D",
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D"
16
+ ],
17
+ "force_upcast": true,
18
+ "in_channels": 3,
19
+ "latent_channels": 4,
20
+ "layers_per_block": 2,
21
+ "norm_num_groups": 32,
22
+ "out_channels": 3,
23
+ "sample_size": 1024,
24
+ "scaling_factor": 0.13025,
25
+ "up_block_types": [
26
+ "UpDecoderBlock2D",
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D",
29
+ "UpDecoderBlock2D"
30
+ ]
31
+ }
vae_encoder/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bc1a62d3f6689ad6441c1867343ce1986b252edb72f45c083a8740bfd6e2a91
3
+ size 68391734