---
# Training-run configuration.
#
# NOTE(review): this file was recovered from a dump in which every line was
# wrapped in "| ... |" and all indentation was lost. The nesting below is
# reconstructed from the empty parent keys and from keys that would otherwise
# be duplicated at one level (e.g. every_n_train_steps). Confirm against the
# code that consumes this config.

# Dataset selection and location.
dataset: point_maze
data_path: /data/user_data/mchen5/dino_wm_dataset/point_maze
pretrained_model_path: /data/hf_cache/hub/models--maxin-cn--Latte/snapshots/fc35c8c44c38e0b446158ace47e7de642066f0d9/vae
n_rollout: null
split_ratio: 0.9
validation_size: 32

# Logging and output locations.
use_wandb: true
results_dir: ./results
pretrained: null

# Model and tokenizer settings.
model: Latte-S/2
use_dynamic_tokenizer: true
num_slots: 256
slot_dim: 16
dec_hidden_size: 384
dec_depth: 12
dec_num_heads: 6

# Sequence, image and sampling settings.
num_frames: 4
n_context_frames: 1
scheduling_mode: full_sequence
image_size: 256
num_sampling_steps: 250
frame_interval: 1
fixed_spatial: false
attention_bias: true
learn_sigma: false
diffusion_mode: diffusion_forcing
extras: 1

# Action conditioning.
use_action: true
action_dim: 2
normalize_action: true

save_ceph: false

# Optimisation and training-loop settings.
learning_rate: 0.0001
clip_max_norm: 0.1
start_clip_iter: 20000
local_batch_size: 16
max_train_steps: 1000000
global_seed: 3407
num_workers: 4
log_every: 10
val_every_n_steps: 1000
lr_warmup_steps: 0
resume_from_checkpoint: null
gradient_accumulation_steps: 1
num_classes: null
use_compile: false
mixed_precision: 32
gradient_checkpointing: true
sequential_loss_grad: true

# Callback settings. The two checkpoint entries share the same key set, so
# each must live in its own mapping to avoid duplicate keys.
callbacks:
  model_checkpoint_across_timesteps:
    every_n_train_steps: 10000
    save_top_k: -1
    save_on_train_epoch_end: true
    save_weights_only: false
    filename: '{epoch}-{step}'
  model_checkpoint_latest:
    every_n_train_steps: 1000
    save_top_k: 1
    save_on_train_epoch_end: false
    save_weights_only: false
    filename: 'latest-{epoch}-{step}'
  # NOTE(review): placed under callbacks because it directly follows the
  # checkpoint entries; it may instead be a top-level key - confirm.
  metrics_logger:
    log_every_n_train_steps: 10000
    save_videos: true
    evaluate: true
    max_batchsize: 4
    buffer_size: 32
    i3d_model_path: checkpoints/i3d/i3d_torchscript.pt
    inference_n_slots:
      - 64
      - 128
      - 256

# Run mode and run identity.
# NOTE(review): assumed to be top-level keys (they follow the callbacks
# section in the original dump) - confirm.
train: true
validate: false
exp_name: tok2_comp=False_mp=32_gc=True
run_id: 6002143-0