diff --git a/checkpoint-13000/optimizer.bin b/checkpoint-13000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..53a1a9d17538548ce3727feba8922ed0e7399f92 --- /dev/null +++ b/checkpoint-13000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c487220a5691d7038899eb1224db72c38f20bdbc67e1805ff2ba5bca5e030e5d +size 6876750164 diff --git a/checkpoint-13000/random_states_0.pkl b/checkpoint-13000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9f9dc1e88b010ac14bfed86d46eda1f88dbf927e --- /dev/null +++ b/checkpoint-13000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0089108873fd3f1346f02c61dae5598d4d90ff10336fd9bb260ba2e56c20b812 +size 14344 diff --git a/checkpoint-13000/scaler.pt b/checkpoint-13000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ced4b569621b283ab409fa5e41736fc0a8f43e6 --- /dev/null +++ b/checkpoint-13000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77f98967818acefa7b6b48d86d0635b780ab57badf525d74c7b5b70c8009b64 +size 988 diff --git a/checkpoint-13000/scheduler.bin b/checkpoint-13000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..659b3049676d8887e114b4cdf874d15663f36c0b --- /dev/null +++ b/checkpoint-13000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee961ed5cbbe8aa04a6a17bc82eac799c17a3005fb0cfac625144c54ed464102 +size 1000 diff --git a/checkpoint-13000/unet/config.json b/checkpoint-13000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca24297c0b035dfc4d0b825081594383b1eddb88 --- /dev/null +++ b/checkpoint-13000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-13000/unet/diffusion_pytorch_model.safetensors b/checkpoint-13000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..400b1a1854983ade4260f9accd270b33ade8b2d2 --- /dev/null +++ b/checkpoint-13000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf36a9d67a678d985c74552d97242687f2a247dcb64e8a7a5052d7286798bf1 +size 3438167536 diff --git a/checkpoint-13000/unet_ema/config.json b/checkpoint-13000/unet_ema/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ee9c00042af4c9a9aeecafaecf44284d98e74ac9 --- /dev/null +++ b/checkpoint-13000/unet_ema/config.json @@ -0,0 +1,75 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "decay": 0.9999, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "inv_gamma": 1.0, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "min_decay": 0.0, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "optimization_step": 13000, + "out_channels": 4, + "power": 0.6666666666666666, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "update_after_step": 0, + "use_ema_warmup": false, + "use_linear_projection": false +} diff --git a/checkpoint-13000/unet_ema/diffusion_pytorch_model.safetensors b/checkpoint-13000/unet_ema/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b378bc6e202457abd80837f3442da8bf3ec8f918 --- /dev/null +++ b/checkpoint-13000/unet_ema/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904ee3d6e0f9d629e895ba3fd0c2a589c50a655018db4f4b18b39ab9a55323d9 +size 3438167536 diff --git a/checkpoint-13000/vae/config.json b/checkpoint-13000/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..597580bf2ac46222b64ffc672c4aeeddb866bb12 --- /dev/null +++ b/checkpoint-13000/vae/config.json @@ -0,0 +1,37 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "rcannizzaro/vae-dsprites", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 1, + "latent_channels": 4, + "latents_mean": null, + "latents_std": null, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 1, + "sample_size": 64, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": true, + "use_quant_conv": true +} diff --git a/checkpoint-13000/vae/diffusion_pytorch_model.safetensors b/checkpoint-13000/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a95c994af80b5b3f4e63cfe02ea49184ed8d0a2 --- /dev/null +++ b/checkpoint-13000/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e03ac01b9dc178e97f0ef8bd78539194858856567294e860259c0e778063e +size 334624828 diff --git a/checkpoint-13500/optimizer.bin b/checkpoint-13500/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..57b1fbbc7e5288b3c0a14b627bc8782ac6e518fc --- /dev/null +++ b/checkpoint-13500/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ba608bca755f0e6a7648d74dc6bbed7461ffd0db65a6b8062ba28038023f7a +size 6876750164 diff --git a/checkpoint-13500/random_states_0.pkl b/checkpoint-13500/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..89cc3d3a746fea142d9668f0831ba95390e4c1de --- /dev/null +++ b/checkpoint-13500/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9587c2b41eb399eb06818493499019683a068e886c9d5e7feb011969ab78e493 +size 14344 diff --git a/checkpoint-13500/scaler.pt b/checkpoint-13500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..025e7ede23687ba6f87d08eab5f099a2f269162d --- /dev/null +++ b/checkpoint-13500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb4ee3801b11e2b95773f86abaa2d1e4b1da1e9da1588595ee5a4248d6798c1 +size 988 diff --git a/checkpoint-13500/scheduler.bin b/checkpoint-13500/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..0060ee0f5b994fa866429ec769616a7f7271d01e --- /dev/null +++ b/checkpoint-13500/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2cb44ffda49b78703f527708e5b05c7884d2efe41a1c8eb6872d68852fa4d1 +size 1000 diff --git a/checkpoint-13500/unet/config.json b/checkpoint-13500/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca24297c0b035dfc4d0b825081594383b1eddb88 --- /dev/null +++ b/checkpoint-13500/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-13500/unet/diffusion_pytorch_model.safetensors b/checkpoint-13500/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..25811a13e3083dd2e8d921c41b1d6f49cf5f1cf9 --- /dev/null +++ b/checkpoint-13500/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f74a144c14b92f1b47be309e836d63d1885b76578299d9b36e7ab990d214db +size 3438167536 diff --git a/checkpoint-13500/unet_ema/config.json b/checkpoint-13500/unet_ema/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7034068cbed87991dea0002c244563a5a4cffc24 --- /dev/null +++ b/checkpoint-13500/unet_ema/config.json @@ -0,0 +1,75 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "decay": 0.9999, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "inv_gamma": 1.0, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "min_decay": 0.0, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "optimization_step": 13500, + "out_channels": 4, + "power": 0.6666666666666666, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "update_after_step": 0, + "use_ema_warmup": false, + "use_linear_projection": false +} diff --git a/checkpoint-13500/unet_ema/diffusion_pytorch_model.safetensors b/checkpoint-13500/unet_ema/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64d0410f3de7e8c2cd40c47c529a77bdf68d777f --- /dev/null +++ b/checkpoint-13500/unet_ema/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37eb6b33d642d6fcf248025790b122657ea9f0eabaee81febfdbe7ee562aafe3 +size 3438167536 diff --git a/checkpoint-13500/vae/config.json b/checkpoint-13500/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..597580bf2ac46222b64ffc672c4aeeddb866bb12 --- /dev/null +++ b/checkpoint-13500/vae/config.json @@ -0,0 +1,37 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "rcannizzaro/vae-dsprites", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 1, + "latent_channels": 4, + "latents_mean": null, + "latents_std": null, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 1, + "sample_size": 64, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": true, + "use_quant_conv": true +} diff --git a/checkpoint-13500/vae/diffusion_pytorch_model.safetensors b/checkpoint-13500/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a95c994af80b5b3f4e63cfe02ea49184ed8d0a2 --- /dev/null +++ b/checkpoint-13500/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e03ac01b9dc178e97f0ef8bd78539194858856567294e860259c0e778063e +size 334624828 diff --git a/checkpoint-14000/optimizer.bin b/checkpoint-14000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..200f60380b30b64605148a3806950b15e7fa48ec --- /dev/null +++ b/checkpoint-14000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccba29fb3c05b8a05590323f7b848bed569abe64416dd00f091dc23a47f88e82 +size 6876750164 diff --git a/checkpoint-14000/random_states_0.pkl b/checkpoint-14000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..7ed1b61c8ae7ce2a775637eda20e006e9f6d0e84 --- /dev/null +++ b/checkpoint-14000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e532f5e339f687ada4ad0f4e12635843b2122d19ad4381f2f1a38cad5580894 +size 14344 diff --git a/checkpoint-14000/scaler.pt b/checkpoint-14000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b662b51676a156b87defef3451e7cf318983cd7 --- /dev/null +++ b/checkpoint-14000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8972e137dff582ed156c48a434d8d5304443a88bca38ef8e7f0e80298e6f0533 +size 988 diff --git a/checkpoint-14000/scheduler.bin b/checkpoint-14000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..7cb7a98ef3fb5a5b91435413f3326eda689ec709 --- /dev/null +++ b/checkpoint-14000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee032204bba8930df676bada22732e1d1d4fce2e74de1dd6725c0a0c5840cb19 +size 1000 diff --git a/checkpoint-14000/unet/config.json b/checkpoint-14000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca24297c0b035dfc4d0b825081594383b1eddb88 --- /dev/null +++ b/checkpoint-14000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-14000/unet/diffusion_pytorch_model.safetensors b/checkpoint-14000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..800dea07f7ddc7eceb81a19e8396db028cb31a63 --- /dev/null +++ b/checkpoint-14000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d3f7550d7c125ef344f1709f27859d7c0d217e302539f2547928abc031b7a2e +size 3438167536 diff --git a/checkpoint-14000/unet_ema/config.json b/checkpoint-14000/unet_ema/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8088713ab9a40174234b5b0fd4c1cac2f1ed569 --- /dev/null +++ b/checkpoint-14000/unet_ema/config.json @@ -0,0 +1,75 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "decay": 0.9999, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "inv_gamma": 1.0, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "min_decay": 0.0, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "optimization_step": 14000, + "out_channels": 4, + "power": 0.6666666666666666, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "update_after_step": 0, + "use_ema_warmup": false, + "use_linear_projection": false +} diff --git a/checkpoint-14000/unet_ema/diffusion_pytorch_model.safetensors b/checkpoint-14000/unet_ema/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f14668e6cb8c6379bf337f71ccf791293dd3a9f3 --- /dev/null +++ b/checkpoint-14000/unet_ema/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42f619f1c6cf854ca46a34563a4e2de800640efce334d19fa20c11d0c0ce969 +size 3438167536 diff --git a/checkpoint-14000/vae/config.json b/checkpoint-14000/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..597580bf2ac46222b64ffc672c4aeeddb866bb12 --- /dev/null +++ b/checkpoint-14000/vae/config.json @@ -0,0 +1,37 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "rcannizzaro/vae-dsprites", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 1, + "latent_channels": 4, + "latents_mean": null, + "latents_std": null, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 1, + "sample_size": 64, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": true, + "use_quant_conv": true +} diff --git a/checkpoint-14000/vae/diffusion_pytorch_model.safetensors b/checkpoint-14000/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a95c994af80b5b3f4e63cfe02ea49184ed8d0a2 --- /dev/null +++ b/checkpoint-14000/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e03ac01b9dc178e97f0ef8bd78539194858856567294e860259c0e778063e +size 334624828 diff --git a/checkpoint-14500/optimizer.bin b/checkpoint-14500/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..94a2dea71f8d27698092249f36a7d067eba1ce3f --- /dev/null +++ b/checkpoint-14500/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749295ded5ab87b9bf97185a46cffaf01b533b06abadf9b7f4250c188b417ef0 +size 6876750164 diff --git a/checkpoint-14500/random_states_0.pkl b/checkpoint-14500/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..2c6974591c52c64e3f4908b152cb2995978898eb --- /dev/null +++ b/checkpoint-14500/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca062bde709a8c2e3306a170bc711717001272ac9d16e25e0dfe65361436f309 +size 14344 diff --git a/checkpoint-14500/scaler.pt b/checkpoint-14500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..92e6df6461226c7c7dd6dd7a0004d1b6591aacbd --- /dev/null +++ b/checkpoint-14500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa669548d7d0cea54c34bbdeb3defa489898ad7ca32a778f0f5d4793a93394b +size 988 diff --git a/checkpoint-14500/scheduler.bin b/checkpoint-14500/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb6f5fc01daa72256dfedd087eef947d0cd50430 --- /dev/null +++ b/checkpoint-14500/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5e0896943f37464e5d7e427828d84c5c72a094175a2c126366fdfe945c9e33 +size 1000 diff --git a/checkpoint-14500/unet/config.json b/checkpoint-14500/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca24297c0b035dfc4d0b825081594383b1eddb88 --- /dev/null +++ b/checkpoint-14500/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-14500/unet/diffusion_pytorch_model.safetensors b/checkpoint-14500/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b19b457f90a53033d6c8f87470b5756d7c757b80 --- /dev/null +++ b/checkpoint-14500/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27afd75200ecc1ce9b84f87e921de245615aba50ee9e77004f7828365bea22c +size 3438167536 diff --git a/checkpoint-14500/unet_ema/config.json b/checkpoint-14500/unet_ema/config.json new file mode 100644 index 0000000000000000000000000000000000000000..349f6e9fc73225ccafd33ef7bf2279f714db949c --- /dev/null +++ b/checkpoint-14500/unet_ema/config.json @@ -0,0 +1,75 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "decay": 0.9999, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "inv_gamma": 1.0, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "min_decay": 0.0, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "optimization_step": 14500, + "out_channels": 4, + "power": 0.6666666666666666, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "update_after_step": 0, + "use_ema_warmup": false, + "use_linear_projection": false +} diff --git a/checkpoint-14500/unet_ema/diffusion_pytorch_model.safetensors b/checkpoint-14500/unet_ema/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1aaadf83a515338934cc23481fd5eeba189ce0ee --- /dev/null +++ b/checkpoint-14500/unet_ema/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e03add9eaaeffd64db56d67ed98704617f73f415eceeb7ba904b490a6eb12bd +size 3438167536 diff --git a/checkpoint-14500/vae/config.json b/checkpoint-14500/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..597580bf2ac46222b64ffc672c4aeeddb866bb12 --- /dev/null +++ b/checkpoint-14500/vae/config.json @@ -0,0 +1,37 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "rcannizzaro/vae-dsprites", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 1, + "latent_channels": 4, + "latents_mean": null, + "latents_std": null, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 1, + "sample_size": 64, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": true, + "use_quant_conv": true +} diff --git a/checkpoint-14500/vae/diffusion_pytorch_model.safetensors b/checkpoint-14500/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a95c994af80b5b3f4e63cfe02ea49184ed8d0a2 --- /dev/null +++ b/checkpoint-14500/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e03ac01b9dc178e97f0ef8bd78539194858856567294e860259c0e778063e +size 334624828 diff --git a/checkpoint-15000/optimizer.bin b/checkpoint-15000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..aed81f3fb6471b17c2b75bf3791c9272e6d371d9 --- /dev/null +++ b/checkpoint-15000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1945bb0627b2b7f1181ddea41b0c2d2122c7abab95e1348356492056e119d3 +size 6876750164 diff --git a/checkpoint-15000/random_states_0.pkl b/checkpoint-15000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..147f1f4a57ffde1282da60095338ebe3de269d0e --- /dev/null +++ b/checkpoint-15000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc1a4ebe3defb6e96618c9203e8e7e9a1f611eb879a37dd2cd1c52b1055587e5 +size 14344 diff --git a/checkpoint-15000/scaler.pt b/checkpoint-15000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..365015aeee3b31cbc062de74953db1994e36a224 --- /dev/null +++ b/checkpoint-15000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2491380f0b55e3e8cbfec1654220a94cf6d79d50cd1b1e51dfe593c04a274cb9 +size 988 diff --git a/checkpoint-15000/scheduler.bin b/checkpoint-15000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b446f749a0637774df7577a25badd8627d7bdcf --- /dev/null +++ b/checkpoint-15000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f8cb1c00499c9a11be98e1d3df14acb1c3f608844e19988fc0598608b723e0 +size 1000 diff --git a/checkpoint-15000/unet/config.json b/checkpoint-15000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca24297c0b035dfc4d0b825081594383b1eddb88 --- /dev/null +++ b/checkpoint-15000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-15000/unet/diffusion_pytorch_model.safetensors b/checkpoint-15000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..075f0f597f090681276529fb5b69a48d57bc8cae --- /dev/null +++ b/checkpoint-15000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72eb227af31c16d1fda6cce53a407e485e65f7a61bdb672f32f253165f7bfe54 +size 3438167536 diff --git a/checkpoint-15000/unet_ema/config.json b/checkpoint-15000/unet_ema/config.json new file mode 100644 index 0000000000000000000000000000000000000000..338822d508533950409036a8eabde9a2dc092a6d --- /dev/null +++ b/checkpoint-15000/unet_ema/config.json @@ -0,0 +1,75 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "runwayml/stable-diffusion-v1-5", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "decay": 0.9999, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "inv_gamma": 1.0, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "min_decay": 0.0, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "optimization_step": 15000, + "out_channels": 4, + "power": 0.6666666666666666, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "update_after_step": 0, + "use_ema_warmup": false, + "use_linear_projection": false +} diff --git a/checkpoint-15000/unet_ema/diffusion_pytorch_model.safetensors b/checkpoint-15000/unet_ema/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5703415712e11e74d101bb8305347faefac39249 --- /dev/null +++ b/checkpoint-15000/unet_ema/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56736dfcb35729ebdb67661af898dcbc8cb94e446707ee4e3dfe22aa75a2c9a +size 3438167536 diff --git a/checkpoint-15000/vae/config.json b/checkpoint-15000/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..597580bf2ac46222b64ffc672c4aeeddb866bb12 --- /dev/null +++ b/checkpoint-15000/vae/config.json @@ -0,0 +1,37 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.30.0.dev0", + "_name_or_path": "rcannizzaro/vae-dsprites", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 1, + "latent_channels": 4, + "latents_mean": null, + "latents_std": null, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 1, + "sample_size": 64, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": true, + "use_quant_conv": true +} diff --git a/checkpoint-15000/vae/diffusion_pytorch_model.safetensors b/checkpoint-15000/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a95c994af80b5b3f4e63cfe02ea49184ed8d0a2 --- /dev/null +++ b/checkpoint-15000/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124e03ac01b9dc178e97f0ef8bd78539194858856567294e860259c0e778063e +size 334624828 diff --git a/unet/diffusion_pytorch_model.safetensors b/unet/diffusion_pytorch_model.safetensors index 7227ba1d9d1066ec5facb09e1c142fb8ed0bf2b3..5703415712e11e74d101bb8305347faefac39249 100644 --- a/unet/diffusion_pytorch_model.safetensors +++ b/unet/diffusion_pytorch_model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0921981c3e131d2e04bf9ce534cd42f6a14dd2acc04f75e9e42026031b9f8b37 +oid sha256:f56736dfcb35729ebdb67661af898dcbc8cb94e446707ee4e3dfe22aa75a2c9a size 3438167536 diff --git a/val_imgs_grid.png b/val_imgs_grid.png index 773577a4fe4314c95c5da9a5c5a720070985e532..27d5e48c3c310fb9e7dc91a3a720adb7270f97c5 100644 Binary files a/val_imgs_grid.png and b/val_imgs_grid.png differ