|
|
|
|
|
|
|
|
|
|
|
TASK: UniCLTask |
|
|
|
NAME: 'Example Eval Configuration' |
|
SAVE_TIMER_LOG: true |
|
|
|
|
|
SAVE_DIR: '' |
|
LOG_EVERY: 10 |
|
LOGLEVEL_OVERRIDE: INFO |
|
LOG_GPU_MEM: true |
|
RESUME: false |
|
RESET_DATA_LOADER: false |
|
|
|
FP16: true |
|
ZERO_STAGE: 0 |
|
DEEPSPEED: false |
|
|
|
AMP: PYTORCH |
|
|
|
|
|
|
|
|
|
FIND_UNUSED_PARAMETERS: false |
|
|
|
SAVE_PER_OPTIM_STEPS: 500 |
|
EVAL_PER_OPTIM_STEPS: 250 |
|
EVAL_AT_START: false |
|
|
|
|
|
|
|
NO_AUTO_LR_SCALING: true |
|
GRAD_CLIPPING: 1.0 |
|
|
|
SET_SAMPLER_EPOCH: true |
|
|
|
DONT_LOAD_MODEL: true |
|
|
|
user_dir: "./MainzVision" |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
VERBOSE: true |
|
WORKERS: 6 |
|
PIN_MEMORY: true |
|
IMAGE_ENCODER: |
|
NAME: davit_v1 |
|
NUM_CLASSES: 0 |
|
|
|
IMAGE_SIZE: [480, 480] |
|
LOAD_PRETRAINED: true |
|
PRETRAINED: '' |
|
PRETRAINED_LAYERS: '*' |
|
IMAGE_MEAN: [0.485, 0.456, 0.406] |
|
IMAGE_STD: [0.229, 0.224, 0.225] |
|
SPEC: |
|
DROP_RATE: 0.1 |
|
DROP_PATH_RATE: 0.2 |
|
PATCH_SIZE: [7, 3, 3, 3] |
|
PATCH_STRIDE: [4, 2, 2, 2] |
|
PATCH_PADDING: [3, 1, 1, 1] |
|
PATCH_PRENORM: [false, true, true, true] |
|
DIM_EMBED: [256, 512, 1024, 2048] |
|
NUM_HEADS: [8, 16, 32, 64] |
|
NUM_GROUPS: [8, 16, 32, 64] |
|
DEPTHS: [1, 1, 9, 1] |
|
WINDOW_SIZE: 12 |
|
ENABLE_CHECKPOINT: true |
|
|
|
LANG_ENCODER: |
|
NAME: transformer |
|
LOAD_PRETRAINED: false |
|
PRETRAINED: '' |
|
PRETRAINED_LAYERS: '*' |
|
TOKENIZER: clip |
|
CONTEXT_LENGTH: 77 |
|
WIDTH: 1024 |
|
HEADS: 16 |
|
LAYERS: 16 |
|
AUTOGRESSIVE: false |
|
|
|
UNICL_MODEL: |
|
DIM_PROJECTION: 1024 |
|
GATHER_TENSORS: true |
|
LOAD_PRETRAINED: true |
|
|
|
|
|
PRETRAINED: '' |
|
|
|
PRETRAINED_LAYERS: '*' |
|
|
|
AUG: |
|
MIXUP_PROB: 0.0 |
|
MIXUP: 0.8 |
|
MIXCUT: 1.0 |
|
MIXCUT_MINMAX: [] |
|
MIXUP_SWITCH_PROB: 0.5 |
|
MIXUP_MODE: 'batch' |
|
SCALE: [0.8, 1.0] |
|
RATIO: [0.75, 1.3333333] |
|
INTERPOLATION: 'bicubic' |
|
TORCHVISION_AUG: |
|
AUTO_AUGMENT: ta_wide |
|
RE_PROB: 0.25 |
|
HFLIP: 0.0 |
|
VFLIP: 0.0 |
|
|
|
LOSS: |
|
LOSS: UniCL |
|
DATASET: |
|
DATASET: 'image_text_pairs_v2' |
|
TEXT_FORMAT: 'json' |
|
ROOT: '' |
|
TRAIN_SET: 'mimic_cxr_v2-chestxray14-chexpertv4-irma2009_v2-rsnaboneage-mura-bingmedicalfewshot' |
|
DATA_FORMAT: 'tsv' |
|
SAMPLER: 'default' |
|
LOADER: 'default' |
|
TOKEN_FILE: '' |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
EVALDATASET_LTCXR_S100_N100_TEXT_CLASSIFIER: |
|
TEXT_FORMAT: json |
|
FORMAT: 'zip' |
|
SPLIT: 'NIH-CXR-LT' |
|
ZIP_FILE: '' |
|
ZIP_MAP_FILE: '' |
|
LABEL_FILE: '' |
|
IMAGE_TSV: '' |
|
TEXT_TSV: '' |
|
CWEIGHT_FILE: '' |
|
ZS_MODE: 2 |
|
ZS_WEIGHT: 1.0 |
|
KNN: 100 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
ZEROSHOT_EVAL_DATASET: |
|
FORMAT: 'zip' |
|
SPLIT: 'NIH-CXR-LT' |
|
ZIP_FILE: '' |
|
ZIP_MAP_FILE: '' |
|
LABEL_FILE: '' |
|
|
|
|
|
|
|
EVALUATION_SPLITS: ['cls-zeroshot-eval'] |
|
TEST: |
|
BATCH_SIZE_PER_GPU: 8 |
|
MODEL_FILE: '' |
|
CENTER_CROP: false |
|
TRAIN: |
|
BATCH_SIZE_TOTAL: 1024 |
|
BATCH_SIZE_PER_GPU: 16 |
|
|
|
SHUFFLE: true |
|
|
|
WEIGHT_SMOOTHING: |
|
decay: 0.999 |
|
use_cpu: false |
|
eval_smoothed_weight: true |
|
|
|
START_LEARNING_RATE: 0.00001 |
|
|
|
MAX_NUM_EPOCHS: 100 |
|
OPTIMIZER: AdamW |
|
OPTIMIZER_PARAMS: |
|
weight_decay: 0.2 |
|
CUSTOMIZED_PARAMS_CONF: |
|
NO_WEIGHT_DECAY_MODULES: ['dw', 'norm'] |
|
WEIGHT_DECAY_PATTERNS: |
|
"\\.bias$": 0.0 |
|
"logit_scale": 0.0 |
|
"positional_embedding": 0.0 |
|
"token_embedding": 0.0 |
|
|
|
|
|
|
|
LR_SCHEDULER: TimmScheduler |
|
LR_SCHEDULER_PARAMS: |
|
sched: cosine |
|
warmup_steps: 5 |
|
warmup_lr: 0.000000001 |
|
min_lr: 0.000000001 |
|
|
|
|
|
|
|
GRADIENT_ACCUMULATE_STEP: -1 |
|
|