abzal-glw committed on
Commit
28cc3d2
·
verified ·
1 Parent(s): 0da62fc

Upload terramind_v3_pretrain_warm/config.yaml with huggingface_hub

Browse files
terramind_v3_pretrain_warm/config.yaml ADDED
@@ -0,0 +1,117 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ augment: true
3
+ batch_size: 8
4
+ block_buffer_deg: 0.02
5
+ block_salt: cryosentinel-blocks-v1
6
+ block_size_deg: 0.25
7
+ copy_paste:
8
+ min_donor_water_pixels: 32
9
+ p: 0.3
10
+ sub_sample_frac: 1.0
11
+ data_dir: /tmp/multimodal_chips_v3
12
+ hard_neg_sampler:
13
+ positive_to_negative_ratio: 3.0
14
+ replacement: true
15
+ hard_neg_water_frac_threshold: 0.002
16
+ include_unknown_in_train: true
17
+ mosaic:
18
+ jitter: 0.2
19
+ p: 0.15
20
+ multi_scale:
21
+ p: 0.5
22
+ scale_max: 1.25
23
+ scale_min: 0.75
24
+ norm_stats_path: /tmp/multimodal_chips_v3/dataset_stats_v3.json
25
+ num_workers: 0
26
+ persistent_workers: false
27
+ pin_memory: false
28
+ regions:
29
+ - hindu_kush
30
+ - pamir
31
+ - karakoram
32
+ - western_himalaya
33
+ - central_himalaya
34
+ - eastern_himalaya
35
+ - hengduan_nyainqentanglha
36
+ - tibetan_plateau
37
+ - hma_other
38
+ - tien_shan_full
39
+ - ile_alatau
40
+ - zhetysu_alatau
41
+ rot90: false
42
+ shard_cache_size: 200
43
+ shuffle_train: true
44
+ spectral_jitter:
45
+ eps_dem: 0.02
46
+ eps_s1: 0.1
47
+ eps_s2: 0.05
48
+ p: 0.5
49
+ use_block_split: true
50
+ years:
51
+ - 2017
52
+ - 2021
53
+ - 2022
54
+ - 2023
55
+ model:
56
+ backbone: terramind_v1_large
57
+ backbone_lr_mult: 0.1
58
+ backbone_pretrained: true
59
+ compile_model: true
60
+ decoder: UperNetDecoder
61
+ decoder_kwargs:
62
+ decoder_channels: 256
63
+ decoder_scale_modules: true
64
+ dice_variant: generalized
65
+ focal_alpha: 0.25
66
+ focal_gamma: 2.0
67
+ freeze_backbone_layers: 0
68
+ label_smoothing: 0.1
69
+ llrd_decay: 0.75
70
+ loss_type: mega
71
+ lovasz_per_image: true
72
+ lr: 3.0e-05
73
+ modalities:
74
+ - S2L2A
75
+ - S1GRD
76
+ - DEM
77
+ ohem_keep_ratio: 0.5
78
+ ohem_min_kept: 4096
79
+ pos_weight_max: 100.0
80
+ test_tta: true
81
+ tversky_alpha: 0.3
82
+ tversky_beta: 0.7
83
+ val_tta: true
84
+ w_bce: 0.5
85
+ w_boundary: 0.5
86
+ w_dice: 1.0
87
+ w_focal: 1.0
88
+ w_lovasz: 0.3
89
+ w_tversky: 0.5
90
+ weight_decay: 0.0001
91
+ output_dir: /ckpts
92
+ run_name: terramind_v3_pretrain_warm
93
+ run_test: true
94
+ seed: 42
95
+ trainer:
96
+ accelerator: gpu
97
+ accumulate_grad_batches: 2
98
+ check_val_every_n_epoch: 1
99
+ checkpoint_every_n_steps: 500
100
+ devices: 1
101
+ early_stopping_patience: 5
102
+ ema:
103
+ apply_at_test: true
104
+ apply_at_validation: true
105
+ cpu_shadow: true
106
+ decay: 0.999
107
+ skip_buffers: true
108
+ gradient_clip_val: 1.0
109
+ hf_push:
110
+ every_n_epochs: 1
111
+ every_n_train_steps: 500
112
+ push_best_too: true
113
+ repo_id: abzal-glw/cryosentinel-terramind-v3
114
+ run_name: terramind_v3_pretrain_warm
115
+ log_every_n_steps: 25
116
+ max_epochs: 6
117
+ precision: bf16-mixed