{ "_class_name": "CausalVideoVAE", "_diffusers_version": "0.29.2", "add_post_quant_conv": true, "decoder_act_fn": "silu", "decoder_block_dropout": [ 0.0, 0.0, 0.0, 0.0 ], "decoder_block_out_channels": [ 128, 256, 512, 512 ], "decoder_in_channels": 16, "decoder_layers_per_block": [ 3, 3, 3, 3 ], "decoder_norm_num_groups": 32, "decoder_out_channels": 3, "decoder_spatial_up_sample": [ true, true, true, false ], "decoder_temporal_up_sample": [ true, true, true, false ], "decoder_type": "causal_vae_conv", "decoder_up_block_types": [ "UpDecoderBlockCausal3D", "UpDecoderBlockCausal3D", "UpDecoderBlockCausal3D", "UpDecoderBlockCausal3D" ], "downsample_scale": 8, "encoder_act_fn": "silu", "encoder_block_dropout": [ 0.0, 0.0, 0.0, 0.0 ], "encoder_block_out_channels": [ 128, 256, 512, 512 ], "encoder_double_z": true, "encoder_down_block_types": [ "DownEncoderBlockCausal3D", "DownEncoderBlockCausal3D", "DownEncoderBlockCausal3D", "DownEncoderBlockCausal3D" ], "encoder_in_channels": 3, "encoder_layers_per_block": [ 2, 2, 2, 2 ], "encoder_norm_num_groups": 32, "encoder_out_channels": 16, "encoder_spatial_down_sample": [ true, true, true, false ], "encoder_temporal_down_sample": [ true, true, true, false ], "encoder_type": "causal_vae_conv", "interpolate": false, "sample_size": 256, "scaling_factor": 0.13025 }