Upload folder using huggingface_hub
Browse files- decoder.safetensors +3 -0
- decoder_conf.yml +82 -0
- encoder.safetensors +3 -0
- encoder_conf.yml +73 -0
decoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33bc72089283767d00ffc85eac8beca3f5c4158c1049ba44f3e93a188c5de6bb
|
| 3 |
+
size 278084696
|
decoder_conf.yml
ADDED
|
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model:
|
| 2 |
+
model_id: dcae
|
| 3 |
+
sample_size:
|
| 4 |
+
- 360
|
| 5 |
+
- 640
|
| 6 |
+
channels: 3
|
| 7 |
+
latent_size: 32
|
| 8 |
+
latent_channels: 16
|
| 9 |
+
ch_0: 128
|
| 10 |
+
ch_max: 1024
|
| 11 |
+
encoder_blocks_per_stage:
|
| 12 |
+
- 1
|
| 13 |
+
- 1
|
| 14 |
+
- 1
|
| 15 |
+
- 1
|
| 16 |
+
decoder_blocks_per_stage:
|
| 17 |
+
- 1
|
| 18 |
+
- 1
|
| 19 |
+
- 1
|
| 20 |
+
- 1
|
| 21 |
+
use_middle_block: false
|
| 22 |
+
do_channel_mask: false
|
| 23 |
+
skip_logvar: false
|
| 24 |
+
discriminator:
|
| 25 |
+
model_id: seraena
|
| 26 |
+
channels: 3
|
| 27 |
+
latent_channels: 16
|
| 28 |
+
ch_0: 64
|
| 29 |
+
sample_size:
|
| 30 |
+
- 360
|
| 31 |
+
- 640
|
| 32 |
+
train:
|
| 33 |
+
trainer_id: distill_dec_seraena
|
| 34 |
+
data_id: video_dir_loader
|
| 35 |
+
data_kwargs:
|
| 36 |
+
source:
|
| 37 |
+
- /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4
|
| 38 |
+
- /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4
|
| 39 |
+
- /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4
|
| 40 |
+
target_size:
|
| 41 |
+
- 360
|
| 42 |
+
- 640
|
| 43 |
+
target_batch_size: 256
|
| 44 |
+
batch_size: 32
|
| 45 |
+
epochs: 200
|
| 46 |
+
opt: AdamW
|
| 47 |
+
opt_kwargs:
|
| 48 |
+
lr: 0.0001
|
| 49 |
+
weight_decay: 0.0001
|
| 50 |
+
betas:
|
| 51 |
+
- 0.9
|
| 52 |
+
- 0.95
|
| 53 |
+
eps: 1.0e-15
|
| 54 |
+
lpips_type: convnext
|
| 55 |
+
loss_weights:
|
| 56 |
+
lpips: 12.0
|
| 57 |
+
l2: 1.0
|
| 58 |
+
gan: 0.5
|
| 59 |
+
dwt: 0.0
|
| 60 |
+
scheduler: LinearWarmupWithCosineDecay
|
| 61 |
+
scheduler_kwargs:
|
| 62 |
+
warmup_steps: 1000
|
| 63 |
+
decay_after: 120000
|
| 64 |
+
decay_steps: 220000
|
| 65 |
+
start_mult: 0.1
|
| 66 |
+
decay_to_mult: 0.1
|
| 67 |
+
checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_dec_distill_adv_fix
|
| 68 |
+
resume_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16_dec_distill/step_5000.pt
|
| 69 |
+
encoder_cfg: configs/waypoint_1/owl_vae_f16_c16_enc_distill.yml
|
| 70 |
+
encoder_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill/step_110000.pt
|
| 71 |
+
teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt
|
| 72 |
+
teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml
|
| 73 |
+
sample_interval: 1000
|
| 74 |
+
save_interval: 5000
|
| 75 |
+
latent_scale: 1.0
|
| 76 |
+
latent_shift: 0.0
|
| 77 |
+
delay_adv: 5000
|
| 78 |
+
warmup_adv: 2000
|
| 79 |
+
wandb:
|
| 80 |
+
name: shahbuland
|
| 81 |
+
project: new_vaes_v2
|
| 82 |
+
run_name: waypoint_1_vae_owlc_f16_c16_dec_distill
|
encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:364680dc0902b61ff6b836a7f88cccdbfc522f13e3cbf2286b342a4aff048d8d
|
| 3 |
+
size 5674296
|
encoder_conf.yml
ADDED
|
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model:
|
| 2 |
+
model_id: dcae
|
| 3 |
+
sample_size:
|
| 4 |
+
- 360
|
| 5 |
+
- 640
|
| 6 |
+
channels: 3
|
| 7 |
+
latent_size: 32
|
| 8 |
+
latent_channels: 16
|
| 9 |
+
ch_0: 64
|
| 10 |
+
ch_max: 256
|
| 11 |
+
encoder_blocks_per_stage:
|
| 12 |
+
- 1
|
| 13 |
+
- 1
|
| 14 |
+
- 1
|
| 15 |
+
- 1
|
| 16 |
+
decoder_blocks_per_stage:
|
| 17 |
+
- 1
|
| 18 |
+
- 1
|
| 19 |
+
- 1
|
| 20 |
+
- 1
|
| 21 |
+
use_middle_block: false
|
| 22 |
+
do_channel_mask: false
|
| 23 |
+
skip_logvar: false
|
| 24 |
+
train:
|
| 25 |
+
trainer_id: distill_enc
|
| 26 |
+
data_id: video_dir_loader
|
| 27 |
+
data_kwargs:
|
| 28 |
+
source:
|
| 29 |
+
- /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4
|
| 30 |
+
- /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4
|
| 31 |
+
- /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4
|
| 32 |
+
target_size:
|
| 33 |
+
- 360
|
| 34 |
+
- 640
|
| 35 |
+
target_batch_size: 256
|
| 36 |
+
batch_size: 32
|
| 37 |
+
epochs: 200
|
| 38 |
+
opt: Muon
|
| 39 |
+
opt_kwargs:
|
| 40 |
+
lr: 0.0005
|
| 41 |
+
momentum: 0.95
|
| 42 |
+
adamw_lr: 0.0001
|
| 43 |
+
adamw_wd: 0.01
|
| 44 |
+
adamw_eps: 1.0e-06
|
| 45 |
+
adamw_betas:
|
| 46 |
+
- 0.9
|
| 47 |
+
- 0.95
|
| 48 |
+
adamw_keys:
|
| 49 |
+
- conv_in
|
| 50 |
+
- conv_out
|
| 51 |
+
- conv_out_logvar
|
| 52 |
+
- .down.
|
| 53 |
+
- .residuals.
|
| 54 |
+
lpips_type: convnext
|
| 55 |
+
loss_weights:
|
| 56 |
+
l2: 1.0
|
| 57 |
+
logvar: 1.0
|
| 58 |
+
scheduler: LinearWarmup
|
| 59 |
+
scheduler_kwargs:
|
| 60 |
+
warmup_steps: 1500
|
| 61 |
+
min_lr: 1.0e-05
|
| 62 |
+
checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill
|
| 63 |
+
resume_ckpt: null
|
| 64 |
+
teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt
|
| 65 |
+
teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml
|
| 66 |
+
sample_interval: 1000
|
| 67 |
+
save_interval: 5000
|
| 68 |
+
latent_scale: 1.0
|
| 69 |
+
latent_shift: 0.0
|
| 70 |
+
wandb:
|
| 71 |
+
name: shahbuland
|
| 72 |
+
project: new_vaes_v2
|
| 73 |
+
run_name: waypoint_1_vae_owlc_f16_c16_enc_distill_highlr
|