| model: | |
| model_id: dcae | |
| sample_size: | |
| - 360 | |
| - 640 | |
| channels: 3 | |
| latent_size: 32 | |
| latent_channels: 16 | |
| ch_0: 64 | |
| ch_max: 256 | |
| encoder_blocks_per_stage: | |
| - 1 | |
| - 1 | |
| - 1 | |
| - 1 | |
| decoder_blocks_per_stage: | |
| - 1 | |
| - 1 | |
| - 1 | |
| - 1 | |
| use_middle_block: false | |
| do_channel_mask: false | |
| skip_logvar: false | |
| train: | |
| trainer_id: distill_enc | |
| data_id: video_dir_loader | |
| data_kwargs: | |
| source: | |
| - /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4 | |
| - /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4 | |
| - /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4 | |
| target_size: | |
| - 360 | |
| - 640 | |
| target_batch_size: 256 | |
| batch_size: 32 | |
| epochs: 200 | |
| opt: Muon | |
| opt_kwargs: | |
| lr: 0.0005 | |
| momentum: 0.95 | |
| adamw_lr: 0.0001 | |
| adamw_wd: 0.01 | |
| adamw_eps: 1.0e-06 | |
| adamw_betas: | |
| - 0.9 | |
| - 0.95 | |
| adamw_keys: | |
| - conv_in | |
| - conv_out | |
| - conv_out_logvar | |
| - .down. | |
| - .residuals. | |
| lpips_type: convnext | |
| loss_weights: | |
| l2: 1.0 | |
| logvar: 1.0 | |
| scheduler: LinearWarmup | |
| scheduler_kwargs: | |
| warmup_steps: 1500 | |
| min_lr: 1.0e-05 | |
| checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill | |
| resume_ckpt: null | |
| teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt | |
| teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml | |
| sample_interval: 1000 | |
| save_interval: 5000 | |
| latent_scale: 1.0 | |
| latent_shift: 0.0 | |
| wandb: | |
| name: shahbuland | |
| project: new_vaes_v2 | |
| run_name: waypoint_1_vae_owlc_f16_c16_enc_distill_highlr | |