| { |
| "_class_name": "CausalVAEModel", |
| "_diffusers_version": "0.27.2", |
| "attn_resolutions": [], |
| "decoder_attention": "AttnBlock3D", |
| "decoder_conv_in": "CausalConv3d", |
| "decoder_conv_out": "CausalConv3d", |
| "decoder_mid_resnet": "ResnetBlock3D", |
| "decoder_resnet_blocks": [ |
| "ResnetBlock3D", |
| "ResnetBlock3D", |
| "ResnetBlock3D", |
| "ResnetBlock3D" |
| ], |
| "decoder_spatial_upsample": [ |
| "", |
| "SpatialUpsample2x", |
| "SpatialUpsample2x", |
| "SpatialUpsample2x" |
| ], |
| "decoder_temporal_upsample": [ |
| "", |
| "", |
| "TimeUpsample2x", |
| "TimeUpsample2x" |
| ], |
| "double_z": true, |
| "dropout": 0.0, |
| "embed_dim": 4, |
| "encoder_attention": "AttnBlock3D", |
| "encoder_conv_in": "CausalConv3d", |
| "encoder_conv_out": "CausalConv3d", |
| "encoder_mid_resnet": "ResnetBlock3D", |
| "encoder_resnet_blocks": [ |
| "ResnetBlock3D", |
| "ResnetBlock3D", |
| "ResnetBlock3D", |
| "ResnetBlock3D" |
| ], |
| "encoder_spatial_downsample": [ |
| "SpatialDownsample2x", |
| "SpatialDownsample2x", |
| "SpatialDownsample2x", |
| "" |
| ], |
| "encoder_temporal_downsample": [ |
| "TimeDownsample2x", |
| "TimeDownsample2x", |
| "", |
| "" |
| ], |
| "hidden_size": 128, |
| "hidden_size_mult": [ |
| 1, |
| 2, |
| 4, |
| 4 |
| ], |
| "loss_params": { |
| "disc_start": 2001, |
| "disc_weight": 0.5, |
| "kl_weight": 1e-06, |
| "logvar_init": 0.0 |
| }, |
| "loss_type": "models.videovae.losses.LPIPSWithDiscriminator", |
| "lr": 1e-05, |
| "num_res_blocks": 2, |
| "q_conv": "CausalConv3d", |
| "resolution": 256, |
| "z_channels": 4 |
| } |
|
|