{
  "architectures": [
    "VideoAutoencoderPipeline"
  ],
  "cal_loss": false,
  "freeze_vae_2d": false,
  "from_pretrained": null,
  "micro_frame_size": 17,
  "model_type": "VideoAutoencoderPipeline",
  "scale": [3.85, 2.32, 2.33, 3.06],
  "shift": [-0.1, 0.34, 0.27, 0.98],
  "spatial_vae": {
    "_class_name": "AutoencoderKL",
    "_diffusers_version": "0.18.0.dev0",
    "_name_or_path": ".",
    "act_fn": "silu",
    "block_out_channels": [128, 256, 512, 512],
    "down_block_types": [
      "DownEncoderBlock2D",
      "DownEncoderBlock2D",
      "DownEncoderBlock2D",
      "DownEncoderBlock2D"
    ],
    "in_channels": 3,
    "latent_channels": 4,
    "layers_per_block": 2,
    "norm_num_groups": 32,
    "out_channels": 3,
    "sample_size": 512,
    "scaling_factor": 0.13025,
    "up_block_types": [
      "UpDecoderBlock2D",
      "UpDecoderBlock2D",
      "UpDecoderBlock2D",
      "UpDecoderBlock2D"
    ],
    "force_upcast": false
  },
  "torch_dtype": "float32",
  "transformers_version": "4.36.2",
  "vae_2d": {
    "from_pretrained": "PixArt-alpha/pixart_sigma_sdxlvae_T5_diffusers",
    "local_files_only": false,
    "micro_batch_size": 4,
    "subfolder": "vae",
    "type": "VideoAutoencoderKL"
  },
  "vae_temporal": {
    "from_pretrained": null,
    "type": "VAE_Temporal_SD"
  }
}