shahbuland committed on
Commit
ba93215
·
verified ·
1 Parent(s): ec3c512

Upload folder using huggingface_hub

Browse files
decoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33bc72089283767d00ffc85eac8beca3f5c4158c1049ba44f3e93a188c5de6bb
3
+ size 278084696
decoder_conf.yml ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ model_id: dcae
3
+ sample_size:
4
+ - 360
5
+ - 640
6
+ channels: 3
7
+ latent_size: 32
8
+ latent_channels: 16
9
+ ch_0: 128
10
+ ch_max: 1024
11
+ encoder_blocks_per_stage:
12
+ - 1
13
+ - 1
14
+ - 1
15
+ - 1
16
+ decoder_blocks_per_stage:
17
+ - 1
18
+ - 1
19
+ - 1
20
+ - 1
21
+ use_middle_block: false
22
+ do_channel_mask: false
23
+ skip_logvar: false
24
+ discriminator:
25
+ model_id: seraena
26
+ channels: 3
27
+ latent_channels: 16
28
+ ch_0: 64
29
+ sample_size:
30
+ - 360
31
+ - 640
32
+ train:
33
+ trainer_id: distill_dec_seraena
34
+ data_id: video_dir_loader
35
+ data_kwargs:
36
+ source:
37
+ - /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4
38
+ - /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4
39
+ - /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4
40
+ target_size:
41
+ - 360
42
+ - 640
43
+ target_batch_size: 256
44
+ batch_size: 32
45
+ epochs: 200
46
+ opt: AdamW
47
+ opt_kwargs:
48
+ lr: 0.0001
49
+ weight_decay: 0.0001
50
+ betas:
51
+ - 0.9
52
+ - 0.95
53
+ eps: 1.0e-15
54
+ lpips_type: convnext
55
+ loss_weights:
56
+ lpips: 12.0
57
+ l2: 1.0
58
+ gan: 0.5
59
+ dwt: 0.0
60
+ scheduler: LinearWarmupWithCosineDecay
61
+ scheduler_kwargs:
62
+ warmup_steps: 1000
63
+ decay_after: 120000
64
+ decay_steps: 220000
65
+ start_mult: 0.1
66
+ decay_to_mult: 0.1
67
+ checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_dec_distill_adv_fix
68
+ resume_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16_dec_distill/step_5000.pt
69
+ encoder_cfg: configs/waypoint_1/owl_vae_f16_c16_enc_distill.yml
70
+ encoder_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill/step_110000.pt
71
+ teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt
72
+ teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml
73
+ sample_interval: 1000
74
+ save_interval: 5000
75
+ latent_scale: 1.0
76
+ latent_shift: 0.0
77
+ delay_adv: 5000
78
+ warmup_adv: 2000
79
+ wandb:
80
+ name: shahbuland
81
+ project: new_vaes_v2
82
+ run_name: waypoint_1_vae_owlc_f16_c16_dec_distill
encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:364680dc0902b61ff6b836a7f88cccdbfc522f13e3cbf2286b342a4aff048d8d
3
+ size 5674296
encoder_conf.yml ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ model_id: dcae
3
+ sample_size:
4
+ - 360
5
+ - 640
6
+ channels: 3
7
+ latent_size: 32
8
+ latent_channels: 16
9
+ ch_0: 64
10
+ ch_max: 256
11
+ encoder_blocks_per_stage:
12
+ - 1
13
+ - 1
14
+ - 1
15
+ - 1
16
+ decoder_blocks_per_stage:
17
+ - 1
18
+ - 1
19
+ - 1
20
+ - 1
21
+ use_middle_block: false
22
+ do_channel_mask: false
23
+ skip_logvar: false
24
+ train:
25
+ trainer_id: distill_enc
26
+ data_id: video_dir_loader
27
+ data_kwargs:
28
+ source:
29
+ - /mnt/data/datasets/extracted_tars/kbm/fps/*/*.mp4
30
+ - /mnt/data/datasets/extracted_tars/kbm/3ps/*/*.mp4
31
+ - /mnt/data/datasets/extracted_tars/kbm/other/*/*.mp4
32
+ target_size:
33
+ - 360
34
+ - 640
35
+ target_batch_size: 256
36
+ batch_size: 32
37
+ epochs: 200
38
+ opt: Muon
39
+ opt_kwargs:
40
+ lr: 0.0005
41
+ momentum: 0.95
42
+ adamw_lr: 0.0001
43
+ adamw_wd: 0.01
44
+ adamw_eps: 1.0e-06
45
+ adamw_betas:
46
+ - 0.9
47
+ - 0.95
48
+ adamw_keys:
49
+ - conv_in
50
+ - conv_out
51
+ - conv_out_logvar
52
+ - .down.
53
+ - .residuals.
54
+ lpips_type: convnext
55
+ loss_weights:
56
+ l2: 1.0
57
+ logvar: 1.0
58
+ scheduler: LinearWarmup
59
+ scheduler_kwargs:
60
+ warmup_steps: 1500
61
+ min_lr: 1.0e-05
62
+ checkpoint_dir: checkpoints/waypoint_1_vae_owlc_f16_c16_enc_distill
63
+ resume_ckpt: null
64
+ teacher_ckpt: checkpoints/waypoint_1_vae_owlc_f16_c16/step_300000.pt
65
+ teacher_cfg: configs/waypoint_1/owl_vae_f16_c16.yml
66
+ sample_interval: 1000
67
+ save_interval: 5000
68
+ latent_scale: 1.0
69
+ latent_shift: 0.0
70
+ wandb:
71
+ name: shahbuland
72
+ project: new_vaes_v2
73
+ run_name: waypoint_1_vae_owlc_f16_c16_enc_distill_highlr