# Provenance (from the Hugging Face Hub file view):
#   uploaded by shahbuland with huggingface_hub ("Upload folder using
#   huggingface_hub"), commit ba93215 (verified), file size 1.49 kB.
# Model architecture settings.
# NOTE(review): nesting under `model:` was reconstructed from a copy whose
# indentation had been stripped; confirm against the consuming schema.
model:
  model_id: dcae
  # Two-element input size; presumably (height, width) -- TODO confirm.
  sample_size:
    - 360
    - 640
  channels: 3
  latent_size: 32
  latent_channels: 16
  # Channel widths; presumably base width and upper cap -- TODO confirm.
  ch_0: 64
  ch_max: 256
  # One entry per stage: four stages with one block each.
  encoder_blocks_per_stage:
    - 1
    - 1
    - 1
    - 1
  decoder_blocks_per_stage:
    - 1
    - 1
    - 1
    - 1
  use_middle_block: false
  do_channel_mask: false
  skip_logvar: false
# Training run settings.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped. Sub-mapping membership (data_kwargs, opt_kwargs,
# loss_weights, scheduler_kwargs) is inferred from key names and grouping;
# confirm against the trainer's config schema.
train:
  trainer_id: distill_enc
  data_id: video_dir_loader
  data_kwargs:
    # Glob patterns selecting the .mp4 files to load.
    source:
      - /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4
      - /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4
      - /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4
    # Same two values as the model's sample_size.
    target_size:
      - 360
      - 640
  # target_batch_size is 8x batch_size; presumably reached via gradient
  # accumulation and/or multiple devices -- TODO confirm.
  target_batch_size: 256
  batch_size: 32
  epochs: 200
  opt: Muon
  opt_kwargs:
    lr: 0.0005
    momentum: 0.95
    # adamw_* entries: presumably settings for parameters handled by AdamW
    # rather than Muon -- TODO confirm.
    adamw_lr: 0.0001
    adamw_wd: 0.01
    adamw_eps: 1.0e-06
    adamw_betas:
      - 0.9
      - 0.95
    # Presumably parameter-name substrings routed to AdamW -- TODO confirm.
    adamw_keys:
      - conv_in
      - conv_out
      - conv_out_logvar
      - .down.
      - .residuals.
  lpips_type: convnext
  loss_weights:
    l2: 1.0
    logvar: 1.0
  scheduler: LinearWarmup
  scheduler_kwargs:
    warmup_steps: 1500
    min_lr: 1.0e-05
  checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill
  # No checkpoint to resume from is configured.
  resume_ckpt: null
  # Teacher checkpoint and the config file it is paired with.
  teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt
  teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml
  # Intervals are presumably counted in training steps -- TODO confirm.
  sample_interval: 1000
  save_interval: 5000
  latent_scale: 1.0
  latent_shift: 0.0
# Weights & Biases logging settings.
# NOTE(review): nesting under `wandb:` was reconstructed from a copy whose
# indentation had been stripped; confirm against the consuming schema.
wandb:
  # Presumably the W&B user/entity name -- TODO confirm.
  name: shahbuland
  project: new_vaes_v2
  run_name: waypoint_1_vae_owlc_f16_c16_enc_distill_highlr