# RegionCLIP / pretrain.sh
# akuan123's picture
# Upload 16 files
# 78e1b3b
# NOTE: The pre-training section is still under construction.
# The pre-training code has already been released (PretrainFastRCNN class).
# We are now releasing the config files and scripts (not yet tested), as requested by researchers.
# We will release the pre-training data (image-text pairs) in the near future.
# Distributed training across multiple nodes
# ResNet50 (default: batch 96, lr 0.002, 32 GPUs)
#
# Runs ./tools/train_net.py with the RegionCLIP_RN50 pre-training config,
# requesting 2 nodes x 16 processes per node (the 32 GPUs noted above).
# The trailing KEY VALUE pairs are presumably config overrides consumed by
# train_net.py -- TODO confirm against its argument parser.
# NOTE(review): `python3 -m launch` requires a module named `launch` to be
# importable; possibly `torch.distributed.launch` was intended -- confirm.
#
# The final argument line deliberately has no trailing backslash, so the
# command ends there instead of continuing into whatever line follows it.
python3 -m launch --nnodes=2 --nproc_per_node=16 --master_port 12345 ./tools/train_net.py \
  --num-gpus 16 \
  --config-file ./configs/pretrain/RegionCLIP_RN50.yaml \
  MODEL.WEIGHTS ./pretrained_ckpt/clip/teacher_RN50_student_RN50_OAI_CLIP.pth \
  MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \
  MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866.pth \
  MODEL.CLIP.CONCEPT_POOL_EMB ./pretrained_ckpt/concept_emb/coco_nouns_4764_emb.pth \
  OUTPUT_DIR ./output/pretrain
# ResNet50x4 (default: batch 96, lr 0.002, 32 GPUs)
#
# Runs ./tools/train_net.py with the RegionCLIP_RN50x4 pre-training config,
# requesting 2 nodes x 16 processes per node (the 32 GPUs noted above).
# The trailing KEY VALUE pairs are presumably config overrides consumed by
# train_net.py -- TODO confirm against its argument parser.
# NOTE(review): `python3 -m launch` requires a module named `launch` to be
# importable; possibly `torch.distributed.launch` was intended -- confirm.
# NOTE(review): OUTPUT_DIR is ./output/pretrain, the same value the ResNet50
# command in this file uses; if both commands run back to back they share
# that directory -- confirm this is intended.
#
# The final argument line deliberately has no trailing backslash, so the
# command ends there and nothing appended after it is swallowed as arguments.
python3 -m launch --nnodes=2 --nproc_per_node=16 --master_port 12345 ./tools/train_net.py \
  --num-gpus 16 \
  --config-file ./configs/pretrain/RegionCLIP_RN50x4.yaml \
  MODEL.WEIGHTS ./pretrained_ckpt/clip/teacher_RN50x4_student_RN50x4_OAI_CLIP.pth \
  MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \
  MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866.pth \
  MODEL.CLIP.CONCEPT_POOL_EMB ./pretrained_ckpt/concept_emb/coco_nouns_4764_emb_rn50x4.pth \
  OUTPUT_DIR ./output/pretrain