import cv2 import os import numpy as np import matplotlib.pyplot as plt # -------------------------- For Detection Task -------------------------- ## Draw bbox & label on the image def plot_bbox_labels(img, bbox, label=None, cls_color=None, text_scale=0.4): x1, y1, x2, y2 = bbox x1, y1, x2, y2 = int(x1), int(y1), int(x2), int(y2) t_size = cv2.getTextSize(label, 0, fontScale=1, thickness=2)[0] # plot bbox cv2.rectangle(img, (x1, y1), (x2, y2), cls_color, 2) if label is not None: # plot title bbox cv2.rectangle(img, (x1, y1-t_size[1]), (int(x1 + t_size[0] * text_scale), y1), cls_color, -1) # put the test on the title bbox cv2.putText(img, label, (int(x1), int(y1 - 5)), 0, text_scale, (0, 0, 0), 1, lineType=cv2.LINE_AA) return img ## Visualize the detection results def visualize(image, bboxes, scores, labels, class_colors, class_names): ts = 0.4 for i, bbox in enumerate(bboxes): cls_id = int(labels[i]) cls_color = class_colors[cls_id] mess = '%s: %.2f' % (class_names[cls_id], scores[i]) image = plot_bbox_labels(image, bbox, mess, cls_color, text_scale=ts) return image ## Visualize the input data during the training stage def vis_data(images, targets, num_classes=80, normalized_bbox=False, color_format='bgr', pixel_mean=None, pixel_std=None, box_format="xyxy"): """ images: (tensor) [B, 3, H, W] targets: (list) a list of targets """ batch_size = images.size(0) np.random.seed(0) class_colors = [(np.random.randint(255), np.random.randint(255), np.random.randint(255)) for _ in range(num_classes)] for bi in range(batch_size): tgt_boxes = targets[bi]['boxes'] tgt_labels = targets[bi]['labels'] # to numpy image = images[bi].permute(1, 2, 0).cpu().numpy() # denormalize image if pixel_mean is not None and pixel_std is not None: image = image * pixel_std + pixel_mean if color_format == 'rgb': image = image[..., (2, 1, 0)] # RGB to BGR image = image.astype(np.uint8) image = image.copy() img_h, img_w = image.shape[:2] # visualize target for box, label in zip(tgt_boxes, tgt_labels): if box_format == "xyxy": x1, y1, x2, y2 = box elif box_format == "xywh": cx, cy, bw, bh = box x1 = cx - 0.5 * bw y1 = cy - 0.5 * bh x2 = cx + 0.5 * bw y2 = cy + 0.5 * bh if normalized_bbox: x1 *= img_w y1 *= img_h x2 *= img_w y2 *= img_h x1, y1 = int(x1), int(y1) x2, y2 = int(x2), int(y2) cls_id = int(label) # draw box color = class_colors[cls_id] cv2.rectangle(image, (x1, y1), (x2, y2), color, 2) cv2.imshow('train target', image) cv2.waitKey(0) ## convert feature to he heatmap def convert_feature_heatmap(feature): """ feature: (ndarray) [H, W, C] """ heatmap = None return heatmap ## draw feature on the image def draw_feature(img, features, save=None): """ img: (ndarray & cv2.Mat) [H, W, C], where the C is 3 for RGB or 1 for Gray. features: (List[ndarray]). It is a list of the multiple feature map whose shape is [H, W, C]. save: (bool) save the result or not. """ img_h, img_w = img.shape[:2] for i, fmp in enumerate(features): hmp = convert_feature_heatmap(fmp) hmp = cv2.resize(hmp, (img_w, img_h)) hmp = hmp.astype(np.uint8)*255 hmp_rgb = cv2.applyColorMap(hmp, cv2.COLORMAP_JET) superimposed_img = hmp_rgb * 0.4 + img # show the heatmap plt.imshow(hmp) plt.close() # show the image with heatmap cv2.imshow("image with heatmap", superimposed_img) cv2.waitKey(0) cv2.destroyAllWindows() if save: save_dir = 'feature_heatmap' os.makedirs(save_dir, exist_ok=True) cv2.imwrite(os.path.join(save_dir, 'feature_{}.png'.format(i) ), superimposed_img) # -------------------------- For Tracking Task -------------------------- def get_color(idx): idx = idx * 3 color = ((37 * idx) % 255, (17 * idx) % 255, (29 * idx) % 255) return color def plot_tracking(image, tlwhs, obj_ids, scores=None, frame_id=0, fps=0., ids2=None): im = np.ascontiguousarray(np.copy(image)) im_h, im_w = im.shape[:2] top_view = np.zeros([im_w, im_w, 3], dtype=np.uint8) + 255 #text_scale = max(1, image.shape[1] / 1600.) #text_thickness = 2 #line_thickness = max(1, int(image.shape[1] / 500.)) text_scale = 2 text_thickness = 2 line_thickness = 3 radius = max(5, int(im_w/140.)) cv2.putText(im, 'frame: %d fps: %.2f num: %d' % (frame_id, fps, len(tlwhs)), (0, int(15 * text_scale)), cv2.FONT_HERSHEY_PLAIN, 2, (0, 0, 255), thickness=2) for i, tlwh in enumerate(tlwhs): x1, y1, w, h = tlwh intbox = tuple(map(int, (x1, y1, x1 + w, y1 + h))) obj_id = int(obj_ids[i]) id_text = '{}'.format(int(obj_id)) if ids2 is not None: id_text = id_text + ', {}'.format(int(ids2[i])) color = get_color(abs(obj_id)) cv2.rectangle(im, intbox[0:2], intbox[2:4], color=color, thickness=line_thickness) cv2.putText(im, id_text, (intbox[0], intbox[1]), cv2.FONT_HERSHEY_PLAIN, text_scale, (0, 0, 255), thickness=text_thickness) return im