# Experiment config for a dense-captioning run (train and test task are both
# "DenseCap"). Values not set here are expected to come from the base config
# named by _BASE_.
#
# NOTE(review): nesting was reconstructed from a flattened copy of this file.
# The placement of BEAM_SIZE and VIT_LAYERS directly under MODEL (rather than
# under ROI_HEADS / BACKBONE) should be confirmed against the project's config
# defaults.
_BASE_: "Base.yaml"
MODEL:
  TRAIN_TASK: ["DenseCap"]
  TEST_TASK: "DenseCap"
  MASK_ON: False
  ROI_HEADS:
    SOFT_NMS_ENABLED: False
  BEAM_SIZE: 1
  # Initial weights; the file name indicates an MAE-pretrained ViT-Base checkpoint.
  WEIGHTS: "detectron2://ImageNetPretrained/MAE/mae_pretrain_vit_base.pth"
  BACKBONE:
    NAME: build_vit_fpn_backbone
  VIT_LAYERS: 12
SOLVER:
  VIT_LAYER_DECAY_RATE: 0.7
DATASETS:
  # Tuple-style values are kept as written; presumably parsed by the config
  # loader as Python literals -- verify before reformatting them as YAML lists.
  TRAIN: ("vg_train",)
  TEST: ("vg_test",)
DATALOADER:
  DATASET_BS: 2
OUTPUT_DIR: "./output/GRiT_B_DenseCap"