Upload ./config.json with huggingface_hub
Browse files- config.json +191 -0
config.json
ADDED
@@ -0,0 +1,191 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
AMP_ENABLE: true
|
2 |
+
AMP_OPT_LEVEL: ''
|
3 |
+
AUG:
|
4 |
+
AUTO_AUGMENT: rand-m9-mstd0.5-inc1
|
5 |
+
COLOR_JITTER: 0.4
|
6 |
+
CUTMIX: 1.0
|
7 |
+
CUTMIX_MINMAX: null
|
8 |
+
MIXUP: 0.8
|
9 |
+
MIXUP_MODE: batch
|
10 |
+
MIXUP_PROB: 1.0
|
11 |
+
MIXUP_SWITCH_PROB: 0.5
|
12 |
+
RECOUNT: 1
|
13 |
+
REMODE: pixel
|
14 |
+
REPROB: 0.25
|
15 |
+
BASE:
|
16 |
+
- ''
|
17 |
+
DATA:
|
18 |
+
BATCH_SIZE: 128
|
19 |
+
CACHE_MODE: part
|
20 |
+
DATASET: EEG
|
21 |
+
DATA_PATH: /root/zym/HMS/eva
|
22 |
+
IMG_SIZE: 224
|
23 |
+
INTERPOLATION: bicubic
|
24 |
+
MASK_PATCH_SIZE: 32
|
25 |
+
MASK_RATIO: 0.6
|
26 |
+
NUM_WORKERS: 8
|
27 |
+
PIN_MEMORY: true
|
28 |
+
ZIP_MODE: false
|
29 |
+
ENABLE_AMP: false
|
30 |
+
EVAL_MODE: true
|
31 |
+
FUSED_LAYERNORM: false
|
32 |
+
FUSED_WINDOW_PROCESS: false
|
33 |
+
LOCAL_RANK: 0
|
34 |
+
MODEL:
|
35 |
+
DROP_PATH_RATE: 0.2
|
36 |
+
DROP_RATE: 0.0
|
37 |
+
LABEL_SMOOTHING: 0.1
|
38 |
+
NAME: swin_large_patch4_window7_224_22k
|
39 |
+
NUM_CLASSES: 1000
|
40 |
+
PRETRAINED: ''
|
41 |
+
RESUME: ./output/swin_large_patch4_window7_224_22k/default/ckpt_epoch_89.pth
|
42 |
+
SIMMIM:
|
43 |
+
NORM_TARGET:
|
44 |
+
ENABLE: false
|
45 |
+
PATCH_SIZE: 47
|
46 |
+
SWIN:
|
47 |
+
APE: false
|
48 |
+
DEPTHS:
|
49 |
+
- 2
|
50 |
+
- 2
|
51 |
+
- 18
|
52 |
+
- 2
|
53 |
+
EMBED_DIM: 192
|
54 |
+
IN_CHANS: 3
|
55 |
+
MLP_RATIO: 4.0
|
56 |
+
NUM_HEADS:
|
57 |
+
- 6
|
58 |
+
- 12
|
59 |
+
- 24
|
60 |
+
- 48
|
61 |
+
PATCH_NORM: true
|
62 |
+
PATCH_SIZE: 4
|
63 |
+
QKV_BIAS: true
|
64 |
+
QK_SCALE: null
|
65 |
+
WINDOW_SIZE: 7
|
66 |
+
SWINV2:
|
67 |
+
APE: false
|
68 |
+
DEPTHS:
|
69 |
+
- 2
|
70 |
+
- 2
|
71 |
+
- 6
|
72 |
+
- 2
|
73 |
+
EMBED_DIM: 96
|
74 |
+
IN_CHANS: 3
|
75 |
+
MLP_RATIO: 4.0
|
76 |
+
NUM_HEADS:
|
77 |
+
- 3
|
78 |
+
- 6
|
79 |
+
- 12
|
80 |
+
- 24
|
81 |
+
PATCH_NORM: true
|
82 |
+
PATCH_SIZE: 4
|
83 |
+
PRETRAINED_WINDOW_SIZES:
|
84 |
+
- 0
|
85 |
+
- 0
|
86 |
+
- 0
|
87 |
+
- 0
|
88 |
+
QKV_BIAS: true
|
89 |
+
WINDOW_SIZE: 7
|
90 |
+
SWIN_MLP:
|
91 |
+
APE: false
|
92 |
+
DEPTHS:
|
93 |
+
- 2
|
94 |
+
- 2
|
95 |
+
- 6
|
96 |
+
- 2
|
97 |
+
EMBED_DIM: 96
|
98 |
+
IN_CHANS: 3
|
99 |
+
MLP_RATIO: 4.0
|
100 |
+
NUM_HEADS:
|
101 |
+
- 3
|
102 |
+
- 6
|
103 |
+
- 12
|
104 |
+
- 24
|
105 |
+
PATCH_NORM: true
|
106 |
+
PATCH_SIZE: 4
|
107 |
+
WINDOW_SIZE: 7
|
108 |
+
SWIN_MOE:
|
109 |
+
APE: false
|
110 |
+
AUX_LOSS_WEIGHT: 0.01
|
111 |
+
CAPACITY_FACTOR: 1.25
|
112 |
+
COSINE_ROUTER: false
|
113 |
+
COSINE_ROUTER_DIM: 256
|
114 |
+
COSINE_ROUTER_INIT_T: 0.5
|
115 |
+
DEPTHS:
|
116 |
+
- 2
|
117 |
+
- 2
|
118 |
+
- 6
|
119 |
+
- 2
|
120 |
+
EMBED_DIM: 96
|
121 |
+
GATE_NOISE: 1.0
|
122 |
+
INIT_STD: 0.02
|
123 |
+
IN_CHANS: 3
|
124 |
+
IS_GSHARD_LOSS: false
|
125 |
+
MLP_FC2_BIAS: true
|
126 |
+
MLP_RATIO: 4.0
|
127 |
+
MOE_BLOCKS:
|
128 |
+
- - -1
|
129 |
+
- - -1
|
130 |
+
- - -1
|
131 |
+
- - -1
|
132 |
+
MOE_DROP: 0.0
|
133 |
+
NORMALIZE_GATE: false
|
134 |
+
NUM_HEADS:
|
135 |
+
- 3
|
136 |
+
- 6
|
137 |
+
- 12
|
138 |
+
- 24
|
139 |
+
NUM_LOCAL_EXPERTS: 1
|
140 |
+
PATCH_NORM: true
|
141 |
+
PATCH_SIZE: 4
|
142 |
+
PRETRAINED_WINDOW_SIZES:
|
143 |
+
- 0
|
144 |
+
- 0
|
145 |
+
- 0
|
146 |
+
- 0
|
147 |
+
QKV_BIAS: true
|
148 |
+
QK_SCALE: null
|
149 |
+
TOP_VALUE: 1
|
150 |
+
USE_BPR: true
|
151 |
+
WINDOW_SIZE: 7
|
152 |
+
TYPE: swin
|
153 |
+
OUTPUT: output/swin_large_patch4_window7_224_22k/default
|
154 |
+
PRINT_FREQ: 10
|
155 |
+
SAVE_FREQ: 1
|
156 |
+
SEED: 0
|
157 |
+
TAG: default
|
158 |
+
TEST:
|
159 |
+
CROP: true
|
160 |
+
SEQUENTIAL: false
|
161 |
+
SHUFFLE: false
|
162 |
+
THROUGHPUT_MODE: false
|
163 |
+
TRAIN:
|
164 |
+
ACCUMULATION_STEPS: 1
|
165 |
+
AUTO_RESUME: true
|
166 |
+
BASE_LR: 3.125e-05
|
167 |
+
CLIP_GRAD: 5.0
|
168 |
+
EPOCHS: 90
|
169 |
+
LAYER_DECAY: 1.0
|
170 |
+
LR_SCHEDULER:
|
171 |
+
DECAY_EPOCHS: 30
|
172 |
+
DECAY_RATE: 0.1
|
173 |
+
GAMMA: 0.1
|
174 |
+
MULTISTEPS: []
|
175 |
+
NAME: cosine
|
176 |
+
WARMUP_PREFIX: true
|
177 |
+
MIN_LR: 3.125e-07
|
178 |
+
MOE:
|
179 |
+
SAVE_MASTER: false
|
180 |
+
OPTIMIZER:
|
181 |
+
BETAS:
|
182 |
+
- 0.9
|
183 |
+
- 0.999
|
184 |
+
EPS: 1.0e-08
|
185 |
+
MOMENTUM: 0.9
|
186 |
+
NAME: adamw
|
187 |
+
START_EPOCH: 0
|
188 |
+
USE_CHECKPOINT: false
|
189 |
+
WARMUP_EPOCHS: 5
|
190 |
+
WARMUP_LR: 3.125e-08
|
191 |
+
WEIGHT_DECAY: 0.05
|