akuan123
/

RegionCLIP

Model card Files Files and versions Community

RegionCLIP / visualize_transfer_learning.sh

akuan123's picture

Upload 16 files

78e1b3b almost 2 years ago

history blame contribute delete

2.45 kB

	# visualize detection results from finetuned detectors on custom images

	########################################################

	# Open-vocabulary detector trained on the 866 LVIS base categories, with
	# RegionCLIP (RN50x4) as initialization.
	#
	# Runs ./tools/train_net.py with --eval-only and --num-gpus 1. The trailing
	# KEY VALUE pairs are handed to train_net.py after the flags; presumably they
	# are detectron2-style overrides of the file given by --config-file (confirm
	# against tools/train_net.py).
	# The last five pairs (TEXT_EMB_DIM through RES2_OUT_CHANNELS) are not set by
	# the commented-out RN50 variant further down, so they are presumably
	# specific to the RN50x4 backbone -- verify before changing them.
	#
	# `|| exit` stops the script with the evaluation's own exit status when the
	# run fails, so the visualization step is not run on a stale results file.
	python3 ./tools/train_net.py \
	  --eval-only \
	  --num-gpus 1 \
	  --config-file ./configs/LVISv1-InstanceSegmentation/CLIP_fast_rcnn_R_50_C4_custom_img.yaml \
	  MODEL.WEIGHTS ./pretrained_ckpt/regionclip/regionclip_finetuned-lvis_rn50x4.pth \
	  MODEL.CLIP.TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb_rn50x4.pth \
	  MODEL.CLIP.OPENSET_TEST_TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb_rn50x4.pth \
	  MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \
	  MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866_lsj.pth \
	  MODEL.CLIP.OFFLINE_RPN_LSJ_PRETRAINED True \
	  MODEL.CLIP.TEXT_EMB_DIM 640 \
	  MODEL.RESNETS.DEPTH 200 \
	  MODEL.ROI_BOX_HEAD.POOLER_RESOLUTION 18 \
	  MODEL.ROI_MASK_HEAD.POOLER_RESOLUTION 18 \
	  MODEL.RESNETS.RES2_OUT_CHANNELS 320 \
	  || exit

	# Visualize the prediction JSON file.
	#
	# Passes ./output/inference/lvis_instances_results.json as --input
	# (presumably the file written by the evaluation run above -- confirm) and
	# ./output/regions as --output.
	# Uses python3, the same interpreter as the evaluation command; a bare
	# `python` executable is not present on every system.
	# The final argument carries no trailing backslash, so the command ends here
	# regardless of what follows it in the file.
	python3 ./tools/visualize_json_results.py \
	  --input ./output/inference/lvis_instances_results.json \
	  --output ./output/regions \
	  --dataset lvis_v1_val_custom_img \
	  --conf-threshold 0.05 \
	  --show-unique-boxes \
	  --max-boxes 25 \
	  --small-region-px 8100


	########################################################

	# Open-vocabulary detector trained on the 866 LVIS base categories, with RegionCLIP (RN50) as initialization
	# python3 ./tools/train_net.py \
	# --eval-only \
	# --num-gpus 1 \
	# --config-file ./configs/LVISv1-InstanceSegmentation/CLIP_fast_rcnn_R_50_C4_custom_img.yaml \
	# MODEL.WEIGHTS ./pretrained_ckpt/regionclip/regionclip_finetuned-lvis_rn50.pth \
	# MODEL.CLIP.TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb.pth \
	# MODEL.CLIP.OPENSET_TEST_TEXT_EMB_PATH ./pretrained_ckpt/concept_emb/lvis_1203_cls_emb.pth \
	# MODEL.CLIP.OFFLINE_RPN_CONFIG ./configs/LVISv1-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml \
	# MODEL.CLIP.BB_RPN_WEIGHTS ./pretrained_ckpt/rpn/rpn_lvis_866_lsj.pth \
	# MODEL.CLIP.OFFLINE_RPN_LSJ_PRETRAINED True

	# # visualize the prediction json file
	# python ./tools/visualize_json_results.py \
	# --input ./output/inference/lvis_instances_results.json \
	# --output ./output/regions \
	# --dataset lvis_v1_val_custom_img \
	# --conf-threshold 0.05 \
	# --show-unique-boxes \
	# --max-boxes 25 \
	# --small-region-px 8100