# Page header captured along with this file (not part of the code):
# leiwx52 - "VLog hf gradio demo" - 5a444be - 1.63 kB
from detectron2.config import CfgNode as CN
def add_grit_config(cfg):
    """Install the GRiT-specific keys and their default values on ``cfg``.

    The config is modified in place; nothing is returned.

    Args:
        cfg: Config node (presumably a detectron2 ``CfgNode`` -- confirm
            against callers) that already exposes the ``MODEL`` (with
            ``ROI_BOX_HEAD`` and ``ROI_HEADS``), ``DATALOADER``, ``SOLVER``
            and ``INPUT`` sub-nodes. A new ``TEXT_DECODER`` sub-node is
            created here.
    """
    # Each sub-node is looked up right before its section so that keys are
    # written in the same order as a plain top-to-bottom list of assignments.
    model = cfg.MODEL
    model.BEAM_SIZE = 1
    model.TRAIN_TASK = ["ObjectDet", "DenseCap"]
    # This can be varied if the model is jointly trained on multiple tasks.
    model.TEST_TASK = "DenseCap"

    box_head = model.ROI_BOX_HEAD
    box_head.USE_BIAS = 0.0  # >= 0: not use
    box_head.MULT_PROPOSAL_SCORE = False

    roi_heads = model.ROI_HEADS
    roi_heads.MASK_WEIGHT = 1.0
    roi_heads.OBJECT_FEAT_POOLER_RES = 14
    roi_heads.SOFT_NMS_ENABLED = False

    # Backbones
    model.VIT_LAYERS = 12

    # Text Decoder: attach a fresh node, then fill it through the config.
    cfg.TEXT_DECODER = CN()
    text_decoder = cfg.TEXT_DECODER
    hidden_size = 768
    text_decoder.VOCAB_SIZE = 30522
    text_decoder.HIDDEN_SIZE = hidden_size
    text_decoder.NUM_LAYERS = 6
    text_decoder.ATTENTION_HEADS = 12
    text_decoder.FEEDFORWARD_SIZE = hidden_size * 4

    # Multi-dataset dataloader
    dataloader = cfg.DATALOADER
    dataloader.DATASET_RATIO = [1, 1]  # sample ratio
    dataloader.DATASET_BS = 1
    dataloader.DATASET_INPUT_SIZE = [1024, 1024]
    dataloader.DATASET_INPUT_SCALE = [(0.1, 2.0), (0.1, 2.0)]
    dataloader.DATASET_MIN_SIZES = [(640, 800), (640, 800)]
    dataloader.DATASET_MAX_SIZES = [1333, 1333]

    # Solver
    solver = cfg.SOLVER
    solver.USE_CUSTOM_SOLVER = True
    solver.OPTIMIZER = 'ADAMW'
    solver.VIT_LAYER_DECAY = True
    solver.VIT_LAYER_DECAY_RATE = 0.7

    # Input
    input_cfg = cfg.INPUT
    input_cfg.CUSTOM_AUG = 'EfficientDetResizeCrop'
    input_cfg.TRAIN_SIZE = 1024
    input_cfg.TEST_SIZE = 1024
    input_cfg.SCALE_RANGE = (0.1, 2.0)
    # 'default' for fixed short / long edge
    input_cfg.TEST_INPUT_TYPE = 'default'

    # Top-level switches
    cfg.FIND_UNUSED_PARAM = True
    cfg.USE_ACT_CHECKPOINT = True