diff --git a/backend/vae/configs/sd15.json b/backend/vae/configs/sd15.json index 89300be9..61c28dc4 100644 --- a/backend/vae/configs/sd15.json +++ b/backend/vae/configs/sd15.json @@ -19,6 +19,7 @@ "norm_num_groups": 32, "out_channels": 3, "sample_size": 512, + "scaling_factor": 0.18215, "up_block_types": [ "UpDecoderBlock2D", "UpDecoderBlock2D", diff --git a/backend/vae/configs/sdxl.json b/backend/vae/configs/sdxl.json new file mode 100644 index 00000000..ac908948 --- /dev/null +++ b/backend/vae/configs/sdxl.json @@ -0,0 +1,29 @@ +{ + "_class_name": "AutoencoderKL", + "act_fn": "silu", + "block_out_channels": [ + 128, + 256, + 512, + 512 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "in_channels": 3, + "latent_channels": 4, + "layers_per_block": 2, + "norm_num_groups": 32, + "out_channels": 3, + "sample_size": 1024, + "scaling_factor": 0.13025, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ] +}