abzal-glw committed on
Commit
8472eef
·
verified ·
1 Parent(s): 3034ee0

Upload terramind_v3_finetune_almaty/config.yaml with huggingface_hub

Browse files
terramind_v3_finetune_almaty/config.yaml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ augment: true
3
+ batch_size: 8
4
+ block_buffer_deg: 0.02
5
+ block_salt: cryosentinel-blocks-v1
6
+ block_size_deg: 0.25
7
+ copy_paste:
8
+ min_donor_water_pixels: 32
9
+ p: 0.2
10
+ sub_sample_frac: 1.0
11
+ data_dir: /tmp/multimodal_chips_v3
12
+ hard_neg_sampler:
13
+ positive_to_negative_ratio: 3.0
14
+ replacement: true
15
+ hard_neg_water_frac_threshold: 0.002
16
+ include_unknown_in_train: true
17
+ multi_scale:
18
+ p: 0.5
19
+ scale_max: 1.25
20
+ scale_min: 0.75
21
+ norm_stats_path: /tmp/multimodal_chips_v3/dataset_stats_v3.json
22
+ num_workers: 0
23
+ persistent_workers: false
24
+ pin_memory: false
25
+ regions:
26
+ - tien_shan_full
27
+ - ile_alatau
28
+ - zhetysu_alatau
29
+ rot90: false
30
+ shard_cache_size: 50
31
+ shuffle_train: true
32
+ spectral_jitter:
33
+ eps_dem: 0.02
34
+ eps_s1: 0.08
35
+ eps_s2: 0.04
36
+ p: 0.5
37
+ use_block_split: true
38
+ years:
39
+ - 2017
40
+ - 2021
41
+ - 2022
42
+ - 2023
43
+ model:
44
+ backbone: terramind_v1_large
45
+ backbone_lr_mult: 0.05
46
+ backbone_pretrained: true
47
+ compile_model: true
48
+ decoder: UperNetDecoder
49
+ decoder_kwargs:
50
+ decoder_channels: 256
51
+ decoder_scale_modules: true
52
+ dice_variant: generalized
53
+ focal_alpha: 0.25
54
+ focal_gamma: 2.0
55
+ freeze_backbone_layers: 6
56
+ label_smoothing: 0.1
57
+ llrd_decay: 0.85
58
+ loss_type: mega
59
+ lovasz_per_image: true
60
+ lr: 5.0e-05
61
+ modalities:
62
+ - S2L2A
63
+ - S1GRD
64
+ - DEM
65
+ ohem_keep_ratio: 0.7
66
+ ohem_min_kept: 2048
67
+ pos_weight_max: 200.0
68
+ test_tta: true
69
+ tversky_alpha: 0.25
70
+ tversky_beta: 0.75
71
+ val_tta: false
72
+ w_bce: 0.5
73
+ w_boundary: 0.5
74
+ w_dice: 1.0
75
+ w_focal: 1.0
76
+ w_lovasz: 0.3
77
+ w_tversky: 0.5
78
+ weight_decay: 0.0001
79
+ output_dir: /ckpts
80
+ run_name: terramind_v3_finetune_almaty
81
+ run_test: true
82
+ seed: 42
83
+ trainer:
84
+ accelerator: gpu
85
+ accumulate_grad_batches: 1
86
+ check_val_every_n_epoch: 1
87
+ checkpoint_every_n_steps: 500
88
+ devices: 1
89
+ early_stopping_patience: 6
90
+ ema:
91
+ apply_at_test: true
92
+ apply_at_validation: true
93
+ cpu_shadow: true
94
+ decay: 0.999
95
+ skip_buffers: true
96
+ gradient_clip_val: 1.0
97
+ hf_push:
98
+ every_n_epochs: 1
99
+ every_n_train_steps: 500
100
+ push_best_too: true
101
+ repo_id: abzal-glw/cryosentinel-terramind-v3
102
+ run_name: terramind_v3_finetune_almaty
103
+ log_every_n_steps: 25
104
+ max_epochs: 20
105
+ precision: bf16-mixed
106
+ swa:
107
+ annealing_epochs: 3
108
+ annealing_strategy: cos
109
+ swa_epoch_start: 0.75
110
+ swa_lrs: 1.0e-05