Haroon committed on
Commit
48c8cb4
·
verified ·
1 Parent(s): 0c7b693

Upload folder using huggingface_hub

Browse files
medimageinsight/config.yaml ADDED
@@ -0,0 +1,211 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ##################
2
+ # Trainer settings
3
+ ##################
4
+
5
+
6
+ TASK: UniCLTask
7
+
8
+ NAME: 'Example Eval Configuration'
9
+ SAVE_TIMER_LOG: true
10
+
11
+ # TUTORIAL STEP 1: CHOOSE SAVE DIR
12
+ SAVE_DIR: ''
13
+ LOG_EVERY: 10
14
+ LOGLEVEL_OVERRIDE: INFO
15
+ LOG_GPU_MEM: true
16
+ RESUME: False
17
+ RESET_DATA_LOADER: false
18
+
19
+ FP16: true
20
+ ZERO_STAGE: 0
21
+ DEEPSPEED: false
22
+ # ZERO_STAGE: 1
23
+ AMP: PYTORCH
24
+ # USE_APEX_DDP: false
25
+ # USE_APEX_AMP: false
26
+ # USE_HIT: false
27
+
28
+ FIND_UNUSED_PARAMETERS: false
29
+
30
+ SAVE_PER_OPTIM_STEPS: 500
31
+ EVAL_PER_OPTIM_STEPS: 250
32
+ EVAL_AT_START: False
33
+ # SAVE_PER_UPDATE_NUM: -1
34
+ # EVAL_PER_UPDATE_NUM: 0 # 0: do evaluation when saving checkpoint, -1: don't do evaluation
35
+
36
+ NO_AUTO_LR_SCALING: true
37
+ GRAD_CLIPPING: 1.0 #0.07
38
+
39
+ SET_SAMPLER_EPOCH: true
40
+
41
+ DONT_LOAD_MODEL: true
42
+
43
+ user_dir: "./MainzVision" # key is lowercase because that is how it is used in Mainz
44
+
45
+ ##################
46
+ # Task settings
47
+ ##################
48
+
49
+
50
+
51
+ VERBOSE: true
52
+ WORKERS: 6
53
+ PIN_MEMORY: true
54
+ IMAGE_ENCODER:
55
+ NAME: davit_v1
56
+ NUM_CLASSES: 0
57
+ #IMAGE_SIZE: [384, 384]
58
+ IMAGE_SIZE: [480, 480]
59
+ LOAD_PRETRAINED: true
60
+ PRETRAINED: ''
61
+ PRETRAINED_LAYERS: '*'
62
+ IMAGE_MEAN: [0.485, 0.456, 0.406]
63
+ IMAGE_STD: [0.229, 0.224, 0.225]
64
+ SPEC:
65
+ DROP_RATE: 0.1
66
+ DROP_PATH_RATE: 0.2
67
+ PATCH_SIZE: [7, 3, 3, 3]
68
+ PATCH_STRIDE: [4, 2, 2, 2]
69
+ PATCH_PADDING: [3, 1, 1, 1]
70
+ PATCH_PRENORM: [false, true, true, true]
71
+ DIM_EMBED: [256, 512, 1024, 2048]
72
+ NUM_HEADS: [8, 16, 32, 64]
73
+ NUM_GROUPS: [8, 16, 32, 64]
74
+ DEPTHS: [1, 1, 9, 1]
75
+ WINDOW_SIZE: 12
76
+ ENABLE_CHECKPOINT: true
77
+
78
+ LANG_ENCODER:
79
+ NAME: transformer
80
+ LOAD_PRETRAINED: false
81
+ PRETRAINED: ''
82
+ PRETRAINED_LAYERS: '*'
83
+ TOKENIZER: clip
84
+ CONTEXT_LENGTH: 77
85
+ WIDTH: 1024
86
+ HEADS: 16
87
+ LAYERS: 16
88
+ AUTOGRESSIVE: false
89
+
90
+ UNICL_MODEL:
91
+ DIM_PROJECTION: 1024
92
+ GATHER_TENSORS: true
93
+ LOAD_PRETRAINED: true
94
+
95
+ # TUTORIAL STEP 2: CHOOSE MODEL PATH
96
+ PRETRAINED: ''
97
+
98
+ PRETRAINED_LAYERS: '*'
99
+
100
+ AUG:
101
+ MIXUP_PROB: 0.0
102
+ MIXUP: 0.8
103
+ MIXCUT: 1.0
104
+ MIXCUT_MINMAX: []
105
+ MIXUP_SWITCH_PROB: 0.5
106
+ MIXUP_MODE: 'batch'
107
+ SCALE: [0.8, 1.0]
108
+ RATIO: [0.75, 1.3333333]
109
+ INTERPOLATION: 'bicubic'
110
+ TORCHVISION_AUG:
111
+ AUTO_AUGMENT: ta_wide
112
+ RE_PROB: 0.25
113
+ HFLIP: 0.0
114
+ VFLIP: 0.0
115
+
116
+ LOSS:
117
+ LOSS: UniCL
118
+ DATASET:
119
+ DATASET: 'image_text_pairs_v2'
120
+ TEXT_FORMAT: 'json'
121
+ ROOT: ''
122
+ TRAIN_SET: 'mimic_cxr_v2-chestxray14-chexpertv4-irma2009_v2-rsnaboneage-mura-bingmedicalfewshot'
123
+ DATA_FORMAT: 'tsv'
124
+ SAMPLER: 'default'
125
+ LOADER: 'default'
126
+ TOKEN_FILE: ''
127
+ #PROMPT_ENGINEERING: False
128
+ #SAMPLER: 'chunk'
129
+ #LOADER: 'azcopy'
130
+ #TOKEN_FILE: 'cliptrainingpairs.txt'
131
+ #TEST_SET: 'MarsAtrain'
132
+
133
+
134
+ # TUTORIAL STEP 3: SET ALL OF THE EVAL PATHS BELOW (THESE ARE ALL OPTIONAL EXTRA EVALS)
135
+ # Note how one eval is ZIP format and the other is TSV format.
136
+
137
+
138
+
139
+
140
+ EVALDATASET_LTCXR_S100_N100_TEXT_CLASSIFIER:
141
+ TEXT_FORMAT: json
142
+ FORMAT: 'zip'
143
+ SPLIT: 'NIH-CXR-LT'
144
+ ZIP_FILE: ''
145
+ ZIP_MAP_FILE: ''
146
+ LABEL_FILE: ''
147
+ IMAGE_TSV: ''
148
+ TEXT_TSV: ''
149
+ CWEIGHT_FILE: ''
150
+ ZS_MODE: 2
151
+ ZS_WEIGHT: 1.0
152
+ KNN: 100
153
+ # CLASSIFICATION_SETS: ['NIH-CXR-LT']
154
+ # NUM_CLASSES: [20]
155
+
156
+
157
+
158
+
159
+ # TUTORIAL STEP 4: SET THE DEFAULT ZEROSHOT EVAL (THIS IS THE MANDATORY EVAL)
160
+
161
+ ZEROSHOT_EVAL_DATASET:
162
+ FORMAT: 'zip'
163
+ SPLIT: 'NIH-CXR-LT'
164
+ ZIP_FILE: ''
165
+ ZIP_MAP_FILE: ''
166
+ LABEL_FILE: ''
167
+
168
+
169
+
170
+ EVALUATION_SPLITS: ['cls-zeroshot-eval']
171
+ TEST:
172
+ BATCH_SIZE_PER_GPU: 8
173
+ MODEL_FILE: ''
174
+ CENTER_CROP: false
175
+ TRAIN:
176
+ BATCH_SIZE_TOTAL: 1024
177
+ BATCH_SIZE_PER_GPU: 16
178
+
179
+ SHUFFLE: true
180
+
181
+ WEIGHT_SMOOTHING:
182
+ decay: 0.999
183
+ use_cpu: False
184
+ eval_smoothed_weight: True
185
+
186
+ START_LEARNING_RATE: 0.00001
187
+ # MAX_NUM_EPOCHS: 2
188
+ MAX_NUM_EPOCHS: 100
189
+ OPTIMIZER: AdamW # adam
190
+ OPTIMIZER_PARAMS:
191
+ weight_decay: 0.2 #0.1
192
+ CUSTOMIZED_PARAMS_CONF:
193
+ NO_WEIGHT_DECAY_MODULES: ['dw', 'norm']
194
+ WEIGHT_DECAY_PATTERNS:
195
+ "\\.bias$": 0.0
196
+ "logit_scale": 0.0
197
+ "positional_embedding": 0.0
198
+ "token_embedding": 0.0
199
+
200
+
201
+
202
+ LR_SCHEDULER: TimmScheduler
203
+ LR_SCHEDULER_PARAMS:
204
+ sched: cosine
205
+ warmup_steps: 5
206
+ warmup_lr: 0.000000001
207
+ min_lr: 0.000000001
208
+
209
+ # GRADIENT_ACCUMULATE_STEP will be updated by:
210
+ # BATCH_SIZE_TOTAL // (BATCH_SIZE_PER_GPU * world_size)
211
+ GRADIENT_ACCUMULATE_STEP: -1
medimageinsight/language_model/clip_tokenizer_4.16.2/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
medimageinsight/language_model/clip_tokenizer_4.16.2/special_tokens_map.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "single_word": false,
5
+ "lstrip": false,
6
+ "rstrip": false,
7
+ "normalized": true,
8
+ "special": false
9
+ },
10
+ "eos_token": {
11
+ "content": "<|endoftext|>",
12
+ "single_word": false,
13
+ "lstrip": false,
14
+ "rstrip": false,
15
+ "normalized": true,
16
+ "special": false
17
+ },
18
+ "unk_token": {
19
+ "content": "<|endoftext|>",
20
+ "single_word": false,
21
+ "lstrip": false,
22
+ "rstrip": false,
23
+ "normalized": true,
24
+ "special": false
25
+ },
26
+ "pad_token": "<|endoftext|>"
27
+ }
medimageinsight/language_model/clip_tokenizer_4.16.2/tokenizer_config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "errors": "replace",
3
+ "unk_token": {
4
+ "content": "<|endoftext|>",
5
+ "single_word": false,
6
+ "lstrip": false,
7
+ "rstrip": false,
8
+ "normalized": true,
9
+ "special": false,
10
+ "__type": "AddedToken"
11
+ },
12
+ "bos_token": {
13
+ "content": "<|startoftext|>",
14
+ "single_word": false,
15
+ "lstrip": false,
16
+ "rstrip": false,
17
+ "normalized": true,
18
+ "special": false,
19
+ "__type": "AddedToken"
20
+ },
21
+ "eos_token": {
22
+ "content": "<|endoftext|>",
23
+ "single_word": false,
24
+ "lstrip": false,
25
+ "rstrip": false,
26
+ "normalized": true,
27
+ "special": false,
28
+ "__type": "AddedToken"
29
+ },
30
+ "pad_token": "<|endoftext|>",
31
+ "add_prefix_space": false,
32
+ "do_lower_case": true,
33
+ "name_or_path": "openai/clip-vit-base-patch32",
34
+ "model_max_length": 77,
35
+ "special_tokens_map_file": "/home/ncodella/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
36
+ "tokenizer_file": "/home/ncodella/.cache/huggingface/transformers/7811def0c53be25ba790cb67ac785669b508a8d1cf8c912b8ac046c5f08aee68.20428ea8b6821af2719b760af844a371643ff49f255c73285f6ea448e15597fe",
37
+ "tokenizer_class": "CLIPTokenizer"
38
+ }
medimageinsight/language_model/clip_tokenizer_4.16.2/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
medimageinsight/vision_model/medimageinsigt-v1.0.0-001.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eeda63bf616a61664bc95b2c09d3b3d7125209e635678bd3f5f324e9bdb1414
3
+ size 2464060700