| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| |
|
| | from hydra.core.config_store import ConfigStore |
| |
|
| | from .ar_diffusion_decoder_network import DiffusionDecoderGeneralDIT |
| | from .lazy_config_init import LazyCall as L |
| | from .lazy_config_init import LazyDict |
| |
|
# Frame count reused below: it is the second entry of ``latent_shape`` and the
# ``pixel_chunk_duration`` of both the tokenizer and the tokenizer corruptor.
num_frames = 57

# Experiment node for the 7B diffusion decoder. It is written with plain dict
# literals; the only lazily-constructed object is the network under
# ``model.net``.
# NOTE(review): the variable name says INFERENCE_ONLY, but nothing in this
# node itself enforces that -- confirm against the consumer of this config.
Cosmos_DiffusionDecoder_7B_INFERENCE_ONLY: LazyDict = LazyDict(
    {
        # Config-group overrides; "_self_" is listed last.
        "defaults": [
            {"override /net": "faditv2_7b"},
            {"override /tokenizer": "cosmos_video_tokenizer_res720_comp8x8x8_t121_ver092624"},
            {"override /conditioner": "video_latent_diffusion_decoder_cond"},
            {"override /tokenizer_corruptor": "cosmos_video_discrete_tokenizer_res720_comp8x16x16_t49_ver110224"},
            "_self_",
        ],
        "job": {
            # NOTE(review): "deocder" looks like a typo for "decoder". It is
            # kept verbatim because this is a runtime identifier -- confirm
            # nothing depends on the current spelling before renaming.
            "group": "diffusion_deocder_FT_7Bv1_001",
            # This name is also used as the ConfigStore entry name.
            "name": "DD_FT_7Bv1_003_002_tokenizer888_spatch2_discrete_cond_on_token",
        },
        "model": {
            "diffusion_decoder_cond_sigma_low": 0.0,
            "diffusion_decoder_cond_sigma_high": 0.0,
            "diffusion_decoder_corrupt_prob": 0.0,
            "condition_on_tokenizer_corruptor_token": True,
            "latent_shape": [
                16,
                num_frames,
                88,
                160,
            ],
            "tokenizer_corruptor": {
                "pixel_chunk_duration": num_frames,
                # Evaluates to 8 when num_frames is 57.
                # Presumably mirrors an 8x temporal compression of the
                # corruptor tokenizer -- TODO confirm.
                "latent_chunk_duration": 1 + (num_frames - 1) // 8,
            },
            # Lazily-described network: L(...) wraps the class and the keyword
            # arguments below are recorded for it.
            "net": L(DiffusionDecoderGeneralDIT)(
                diffusion_decoder_condition_on_sigma=False,
                max_img_h=240,
                max_img_w=240,
                rope_h_extrapolation_ratio=1.5,
                rope_w_extrapolation_ratio=1.5,
                rope_t_extrapolation_ratio=1,
                block_x_format="THWBD",
                is_diffusion_decoder=True,
                patch_spatial=2,
                diffusion_decoder_condition_on_token=True,
                diffusion_decoder_token_condition_voc_size=64000,
                diffusion_decoder_token_condition_dim=32,
            ),
            "tokenizer": {
                "video_vae": {
                    "pixel_chunk_duration": num_frames,
                },
            },
            "conditioner": {
                "latent_condition": {
                    "dropout_rate": 0.2,
                },
            },
        },
    }
)
| |
|
# Register the experiment node with Hydra's ConfigStore under the
# "experiment" group and the "_global_" package. The entry name is taken from
# the node's own job name, so the two cannot drift apart.
cs = ConfigStore.instance()
cs.store(
    name=Cosmos_DiffusionDecoder_7B_INFERENCE_ONLY["job"]["name"],
    node=Cosmos_DiffusionDecoder_7B_INFERENCE_ONLY,
    group="experiment",
    package="_global_",
)
| |
|