| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| from typing import List |
|
|
| import attrs |
|
|
| from .lazy_config_init import LazyDict |
|
|
|
|
| @attrs.define(slots=False) |
| class DefaultModelConfig: |
| tokenizer: LazyDict = None |
| conditioner: LazyDict = None |
| net: LazyDict = None |
| sigma_data: float = 0.5 |
| precision: str = "bfloat16" |
| input_data_key: str = "video" |
| latent_shape: List[int] = [16, 24, 44, 80] |
|
|
|
|
| @attrs.define(slots=False) |
| class LatentDiffusionDecoderModelConfig(DefaultModelConfig): |
| tokenizer_corruptor: LazyDict = None |
| latent_corruptor: LazyDict = None |
| pixel_corruptor: LazyDict = None |
| diffusion_decoder_cond_sigma_low: float = None |
| diffusion_decoder_cond_sigma_high: float = None |
| diffusion_decoder_corrupt_prob: float = None |
| condition_on_tokenizer_corruptor_token: bool = False |
|
|