Spaces:
Sleeping
Sleeping
# -*- coding: utf-8 -*- | |
# Copyright (c) Alibaba, Inc. and its affiliates. | |
import cv2 | |
import numpy as np | |
from .utils import convert_to_numpy | |
class LayoutBboxAnnotator: | |
def __init__(self, cfg, device=None): | |
self.bg_color = cfg.get('BG_COLOR', [255, 255, 255]) | |
self.box_color = cfg.get('BOX_COLOR', [0, 0, 0]) | |
self.frame_size = cfg.get('FRAME_SIZE', [720, 1280]) # [H, W] | |
self.num_frames = cfg.get('NUM_FRAMES', 81) | |
ram_tag_color_path = cfg.get('RAM_TAG_COLOR_PATH', None) | |
self.color_dict = {'default': tuple(self.box_color)} | |
if ram_tag_color_path is not None: | |
lines = [id_name_color.strip().split('#;#') for id_name_color in open(ram_tag_color_path).readlines()] | |
self.color_dict.update({id_name_color[1]: tuple(eval(id_name_color[2])) for id_name_color in lines}) | |
def forward(self, bbox, frame_size=None, num_frames=None, label=None, color=None): | |
frame_size = frame_size if frame_size is not None else self.frame_size | |
num_frames = num_frames if num_frames is not None else self.num_frames | |
assert len(bbox) == 2, 'bbox should be a list of two elements (start_bbox & end_bbox)' | |
# frame_size = [H, W] | |
# bbox = [x1, y1, x2, y2] | |
label = label[0] if label is not None and isinstance(label, list) else label | |
if label is not None and label in self.color_dict: | |
box_color = self.color_dict[label] | |
elif color is not None: | |
box_color = color | |
else: | |
box_color = self.color_dict['default'] | |
start_bbox, end_bbox = bbox | |
start_bbox = [start_bbox[0], start_bbox[1], start_bbox[2] - start_bbox[0], start_bbox[3] - start_bbox[1]] | |
start_bbox = np.array(start_bbox, dtype=np.float32) | |
end_bbox = [end_bbox[0], end_bbox[1], end_bbox[2] - end_bbox[0], end_bbox[3] - end_bbox[1]] | |
end_bbox = np.array(end_bbox, dtype=np.float32) | |
bbox_increment = (end_bbox - start_bbox) / num_frames | |
ret_frames = [] | |
for frame_idx in range(num_frames): | |
frame = np.zeros((frame_size[0], frame_size[1], 3), dtype=np.uint8) | |
frame[:] = self.bg_color | |
current_bbox = start_bbox + bbox_increment * frame_idx | |
current_bbox = current_bbox.astype(int) | |
x, y, w, h = current_bbox | |
cv2.rectangle(frame, (x, y), (x + w, y + h), box_color, 2) | |
ret_frames.append(frame[..., ::-1]) | |
return ret_frames | |
class LayoutMaskAnnotator: | |
def __init__(self, cfg, device=None): | |
self.use_aug = cfg.get('USE_AUG', False) | |
self.bg_color = cfg.get('BG_COLOR', [255, 255, 255]) | |
self.box_color = cfg.get('BOX_COLOR', [0, 0, 0]) | |
ram_tag_color_path = cfg.get('RAM_TAG_COLOR_PATH', None) | |
self.color_dict = {'default': tuple(self.box_color)} | |
if ram_tag_color_path is not None: | |
lines = [id_name_color.strip().split('#;#') for id_name_color in open(ram_tag_color_path).readlines()] | |
self.color_dict.update({id_name_color[1]: tuple(eval(id_name_color[2])) for id_name_color in lines}) | |
if self.use_aug: | |
from .maskaug import MaskAugAnnotator | |
self.maskaug_anno = MaskAugAnnotator(cfg={}) | |
def find_contours(self, mask): | |
contours, hier = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE) | |
return contours | |
def draw_contours(self, canvas, contour, color): | |
canvas = np.ascontiguousarray(canvas, dtype=np.uint8) | |
canvas = cv2.drawContours(canvas, contour, -1, color, thickness=3) | |
return canvas | |
def forward(self, mask=None, color=None, label=None, mask_cfg=None): | |
if not isinstance(mask, list): | |
is_batch = False | |
mask = [mask] | |
else: | |
is_batch = True | |
if label is not None and label in self.color_dict: | |
color = self.color_dict[label] | |
elif color is not None: | |
color = color | |
else: | |
color = self.color_dict['default'] | |
ret_data = [] | |
for sub_mask in mask: | |
sub_mask = convert_to_numpy(sub_mask) | |
if self.use_aug: | |
sub_mask = self.maskaug_anno.forward(sub_mask, mask_cfg) | |
canvas = np.ones((sub_mask.shape[0], sub_mask.shape[1], 3)) * 255 | |
contour = self.find_contours(sub_mask) | |
frame = self.draw_contours(canvas, contour, color) | |
ret_data.append(frame) | |
if is_batch: | |
return ret_data | |
else: | |
return ret_data[0] | |
class LayoutTrackAnnotator: | |
def __init__(self, cfg, device=None): | |
self.use_aug = cfg.get('USE_AUG', False) | |
self.bg_color = cfg.get('BG_COLOR', [255, 255, 255]) | |
self.box_color = cfg.get('BOX_COLOR', [0, 0, 0]) | |
ram_tag_color_path = cfg.get('RAM_TAG_COLOR_PATH', None) | |
self.color_dict = {'default': tuple(self.box_color)} | |
if ram_tag_color_path is not None: | |
lines = [id_name_color.strip().split('#;#') for id_name_color in open(ram_tag_color_path).readlines()] | |
self.color_dict.update({id_name_color[1]: tuple(eval(id_name_color[2])) for id_name_color in lines}) | |
if self.use_aug: | |
from .maskaug import MaskAugAnnotator | |
self.maskaug_anno = MaskAugAnnotator(cfg={}) | |
from .inpainting import InpaintingVideoAnnotator | |
self.inpainting_anno = InpaintingVideoAnnotator(cfg=cfg['INPAINTING']) | |
def find_contours(self, mask): | |
contours, hier = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE) | |
return contours | |
def draw_contours(self, canvas, contour, color): | |
canvas = np.ascontiguousarray(canvas, dtype=np.uint8) | |
canvas = cv2.drawContours(canvas, contour, -1, color, thickness=3) | |
return canvas | |
def forward(self, color=None, mask_cfg=None, frames=None, video=None, mask=None, bbox=None, label=None, caption=None, mode=None): | |
inp_data = self.inpainting_anno.forward(frames, video, mask, bbox, label, caption, mode) | |
inp_masks = inp_data['masks'] | |
label = label[0] if label is not None and isinstance(label, list) else label | |
if label is not None and label in self.color_dict: | |
color = self.color_dict[label] | |
elif color is not None: | |
color = color | |
else: | |
color = self.color_dict['default'] | |
num_frames = len(inp_masks) | |
ret_data = [] | |
for i in range(num_frames): | |
sub_mask = inp_masks[i] | |
if self.use_aug and mask_cfg is not None: | |
sub_mask = self.maskaug_anno.forward(sub_mask, mask_cfg) | |
canvas = np.ones((sub_mask.shape[0], sub_mask.shape[1], 3)) * 255 | |
contour = self.find_contours(sub_mask) | |
frame = self.draw_contours(canvas, contour, color) | |
ret_data.append(frame) | |
return ret_data | |