# visualize detection results from finetuned detectors on custom images | |
######################################################## | |
# Open-vocabulary detector trained by 866 LVIS base categories, with RegionCLIP (RN50x4) as initialization | |
python3 ./tools/train_net.py \ | |
--eval-only \ | |
--num-gpus 1 \ | |
--config-file ./configs/LVISv1-InstanceSegmentation/CLIP_fast_rcnn_R_50_C4_custom_img.yaml \ | |
MODEL.WEIGHTS ./pretrained_ckpt/regionclip/regionclip_finetuned-lvis_rn50x4.pth \ | |
MODEL.CLIP.TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb_rn50x4.pth \ | |
MODEL.CLIP.OPENSET_TEST_TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb_rn50x4.pth \ | |
MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \ | |
MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866_lsj.pth \ | |
MODEL.CLIP.OFFLINE_RPN_LSJ_PRETRAINED True \ | |
MODEL.CLIP.TEXT_EMB_DIM 640 \ | |
MODEL.RESNETS.DEPTH 200 \ | |
MODEL.ROI_BOX_HEAD.POOLER_RESOLUTION 18 \ | |
MODEL.ROI_MASK_HEAD.POOLER_RESOLUTION 18 \ | |
MODEL.RESNETS.RES2_OUT_CHANNELS 320 \ | |
# visualize the prediction json file | |
python ./tools/visualize_json_results.py \ | |
--input ./output/inference/lvis_instances_results.json \ | |
--output ./output/regions \ | |
--dataset lvis_v1_val_custom_img \ | |
--conf-threshold 0.05 \ | |
--show-unique-boxes \ | |
--max-boxes 25 \ | |
--small-region-px 8100\ | |
######################################################## | |
# Open-vocabulary detector trained by 866 LVIS base categories, with RegionCLIP (RN50) as initialization | |
# python3 ./tools/train_net.py \ | |
# --eval-only \ | |
# --num-gpus 1 \ | |
# --config-file ./configs/LVISv1-InstanceSegmentation/CLIP_fast_rcnn_R_50_C4_custom_img.yaml \ | |
# MODEL.WEIGHTS ./pretrained_ckpt/regionclip/regionclip_finetuned-lvis_rn50.pth \ | |
# MODEL.CLIP.TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb.pth \ | |
# MODEL.CLIP.OPENSET_TEST_TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb.pth \ | |
# MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \ | |
# MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866_lsj.pth \ | |
# MODEL.CLIP.OFFLINE_RPN_LSJ_PRETRAINED True \ | |
# # visualize the prediction json file | |
# python ./tools/visualize_json_results.py \ | |
# --input ./output/inference/lvis_instances_results.json \ | |
# --output ./output/regions \ | |
# --dataset lvis_v1_val_custom_img \ | |
# --conf-threshold 0.05 \ | |
# --show-unique-boxes \ | |
# --max-boxes 25 \ | |
# --small-region-px 8100\ | |