# Source code for soccer_object_detection.test_object_detection

import os
import os.path
import pickle
import sys
from unittest import TestCase
from unittest.mock import MagicMock

import cv2
import numpy as np
import pytest
import rospy
import tf2_ros
import yaml
from cv2 import Mat
from cv_bridge import CvBridge
from sensor_msgs.msg import CameraInfo, Image

from soccer_common import Camera
from soccer_common.utils import download_dataset
from soccer_common.utils_rosparam import set_rosparam_from_yaml_file
from soccer_msgs.msg import GameState, RobotState
from soccer_object_detection.object_detect_node import Label, ObjectDetectionNode


def IoU(boxA, boxB):
    """Return the intersection-over-union of two axis-aligned boxes.

    Both boxes are indexable as ``[xmin, ymin, xmax, ymax]``. Widths and
    heights are computed as ``max - min + 1``, i.e. the corner coordinates
    are treated as inclusive.

    Args:
        boxA: First box, ``[xmin, ymin, xmax, ymax]``.
        boxB: Second box, ``[xmin, ymin, xmax, ymax]``.

    Returns:
        The intersection area divided by the union area as a float, or
        ``0.0`` when the union area is not positive (degenerate boxes),
        instead of raising ``ZeroDivisionError``.
    """
    # determine the (x, y)-coordinates of the intersection rectangle
    xA = max(boxA[0], boxB[0])
    yA = max(boxA[1], boxB[1])
    xB = min(boxA[2], boxB[2])
    yB = min(boxA[3], boxB[3])

    # compute the area of intersection rectangle (clamped at 0 when disjoint)
    interArea = max(0, xB - xA + 1) * max(0, yB - yA + 1)

    # compute the area of both the prediction and ground-truth rectangles
    boxAArea = (boxA[2] - boxA[0] + 1) * (boxA[3] - boxA[1] + 1)
    boxBArea = (boxB[2] - boxB[0] + 1) * (boxB[3] - boxB[1] + 1)

    # union = sum of both areas minus the doubly-counted intersection
    unionArea = boxAArea + boxBArea - interArea
    if unionArea <= 0:
        # Inverted / empty boxes: there is nothing to overlap with.
        return 0.0

    return interArea / float(unionArea)
class TestObjectDetection(TestCase):
    """Tests for ``ObjectDetectionNode`` plus a manual annotation viewer.

    NOTE(review): this class was reconstructed from a listing whose line
    breaks and indentation had been collapsed, so nesting levels were
    inferred from syntax. Statements whose text was lost in that listing are
    marked with ``NOTE(review)`` and must be confirmed against the real file.
    """

    # Drawing order of annotation types in ``test_visualize_annotations``.
    _ANNOTATION_ORDER = {
        "field edge": 0,
        "goalpost": 1,
        "left_goalpost": 2,
        "right_goalpost": 3,
        "crossbar": 4,
        "robot": 5,
        "obstacle": 6,
        "ball": 7,
        "L-Intersection": 8,
        "T-Intersection": 9,
        "X-Intersection": 10,
    }

    # Colour tuples handed to the OpenCV drawing calls, per annotation type.
    _ANNOTATION_COLORS = {
        "robot": (255, 0, 0),
        "ball": (0, 0, 255),
        "goalpost": (0, 255, 255),
        "left_goalpost": (255, 0, 255),
        "right_goalpost": (0, 255, 255),
        "crossbar": (0, 0, 255),
        "field edge": (0, 255, 0),
        "obstacle": (0, 0, 0),
    }

    # Annotation types drawn as a two-corner bounding box.
    _BOX_TYPES = ("robot", "ball", "obstacle")

    # Annotation types drawn as a four-point contour.
    _QUAD_TYPES = ("goalpost", "left_goalpost", "right_goalpost", "crossbar")

    # Letter drawn for each line-intersection annotation type.
    _INTERSECTION_TEXT = {
        "L-Intersection": "L",
        "T-Intersection": "T",
        "X-Intersection": "X",
    }

    @staticmethod
    def _create_node():
        """Initialise ROS and return an ``ObjectDetectionNode`` ready to detect."""
        rospy.init_node("test")

        Camera.reset_position = MagicMock()

        src_path = os.path.dirname(os.path.realpath(__file__))
        model_path = src_path + "/../../models/"

        n = ObjectDetectionNode(model_path=model_path)
        n.robot_state.status = RobotState.STATUS_READY
        n.game_state.gameState = GameState.GAMESTATE_PLAYING
        return n

    @staticmethod
    def _run_detection(n, cvbridge, frame):
        """Resize ``frame`` to 640x480, feed it to ``n.callback`` and return the CameraInfo.

        The node's publishers are replaced by fresh mocks on every call so
        that ``publish.call_args`` only reflects the current frame.
        """
        img = cv2.resize(frame, dsize=(640, 480))
        img_msg: Image = cvbridge.cv2_to_imgmsg(img)

        # Mock the detections; report one subscriber on each publisher.
        n.pub_detection = MagicMock()
        n.pub_boundingbox = MagicMock()
        n.pub_detection.get_num_connections = MagicMock(return_value=1)
        n.pub_boundingbox.get_num_connections = MagicMock(return_value=1)
        n.pub_detection.publish = MagicMock()
        n.pub_boundingbox.publish = MagicMock()

        ci = CameraInfo()
        ci.height = img.shape[0]
        ci.width = img.shape[1]
        # NOTE(review): the two assignment targets below were lost in the
        # collapsed listing (it read "ci.width = img.shape[1] = ci = [...]").
        # They are presumed to be the node's camera info and camera pose;
        # confirm the attribute names against ObjectDetectionNode / Camera.
        n.camera.camera_info = ci
        n.camera.pose.orientation_euler = [0, np.pi / 8, 0]
        n.callback(img_msg)
        return ci

    @staticmethod
    def _published_image(n, cvbridge):
        """Return the image passed to ``pub_detection.publish``, or None if nothing was published."""
        call_args = n.pub_detection.publish.call_args
        if call_args is None:
            return None
        return cvbridge.imgmsg_to_cv2(call_args[0][0])

    @staticmethod
    def _best_iou(bounding_box, label_lines, ci):
        """Return the best IoU between ``bounding_box`` and same-class label lines.

        Each label line is ``<class> <x> <y> <width> <height>``; the four
        values are multiplied by ``ci.width`` / ``ci.height`` and treated as
        a box centre and size.
        """
        detected = [
            bounding_box.xmin,
            bounding_box.ymin,
            bounding_box.xmax,
            bounding_box.ymax,
        ]
        best_iou = 0
        for line in label_lines:
            info = line.split()
            if not info:
                # Tolerate blank lines (e.g. a trailing newline in the label file).
                continue
            if int(info[0]) != int(bounding_box.Class):
                continue

            x, y, width, height = (float(value) for value in info[1:5])
            ground_truth = [
                int((x - width / 2) * ci.width),
                int((y - height / 2) * ci.height),
                int((x + width / 2) * ci.width),
                int((y + height / 2) * ci.height),
            ]
            best_iou = max(best_iou, IoU(detected, ground_truth))
        return best_iou

    def test_object_detection_node(self):
        """Run the detector on every dataset image and check boxes against the labels.

        Every published BALL / ROBOT box at or above the node's confidence
        threshold must reach an IoU above 0.05 with a label of the same
        class; IoUs below 0.5 only produce a ROS warning.
        """
        src_path = os.path.dirname(os.path.realpath(__file__))
        test_path = src_path + "/../../images/simulation"
        # NOTE(review): the dataset URL is an empty string in this copy of the
        # file; it was probably stripped during extraction.
        download_dataset("", folder_path=test_path)

        n = self._create_node()
        cvbridge = CvBridge()

        image_dir = f"{test_path}/images"
        label_dir = f"{test_path}/labels"
        accepted_classes = [Label.BALL.value, Label.ROBOT.value]
        show = "DISPLAY" in os.environ

        # sorted() makes the processing order deterministic across platforms.
        for file_name in sorted(os.listdir(image_dir)):
            print(file_name)
            img: Mat = cv2.imread(os.path.join(image_dir, file_name))
            self.assertIsNotNone(img, f"Could not read image {file_name}")

            ci = self._run_detection(n, cvbridge, img)

            # Labels share the image's base name; swapping the extension (instead
            # of replacing the substring "PNG") also handles lowercase extensions
            # and names that contain "PNG" elsewhere.
            label_name = os.path.splitext(file_name)[0] + ".txt"
            with open(os.path.join(label_dir, label_name)) as f:
                lines = f.readlines()

            mat = self._published_image(n, cvbridge) if show else None
            if mat is not None:
                cv2.imshow("Image", mat)
                cv2.waitKey(1000)
                cv2.destroyAllWindows()

            # Check assertion
            if n.pub_boundingbox.publish.call_args is not None:
                for bounding_box in n.pub_boundingbox.publish.call_args[0][0].bounding_boxes:
                    if bounding_box.probability < n.CONFIDENCE_THRESHOLD:
                        continue
                    if int(bounding_box.Class) not in accepted_classes:
                        continue

                    best_iou = self._best_iou(bounding_box, lines, ci)
                    self.assertGreater(best_iou, 0.05, f"bounding boxes are off by too much! Image= {file_name} Best IOU={best_iou}")
                    if best_iou < 0.5:
                        rospy.logwarn(f"bounding boxes lower than 0.5 Image= {file_name} Best IOU={best_iou}")

            if mat is not None:
                # Blocks until a key is pressed before moving to the next image.
                cv2.imshow("Image", mat)
                cv2.waitKey()
                cv2.destroyAllWindows()

    def test_object_detection_node_cam(self):
        """Feed live frames from camera index 4 through the detector.

        No assertions are made on the detections (there is no ground truth
        for live frames); the test is skipped when the camera cannot be
        opened and ends when a frame can no longer be read.
        """
        n = self._create_node()

        cap = cv2.VideoCapture(4)
        if not cap.isOpened():
            cap.release()
            # exit() here would terminate the whole test run; skip instead.
            self.skipTest("Cannot open camera")

        cvbridge = CvBridge()
        show = "DISPLAY" in os.environ
        try:
            while True:
                ret, frame = cap.read()
                if not ret:
                    print("Can't receive frame (stream end?). Exiting ...")
                    break

                self._run_detection(n, cvbridge, frame)

                if show:
                    mat = self._published_image(n, cvbridge)
                    if mat is not None:
                        cv2.imshow("Image", mat)
                        cv2.waitKey(1)
        finally:
            # Always hand the capture device back, even if the callback raises.
            cap.release()
            if show:
                cv2.destroyAllWindows()

    def _draw_annotation(self, img, a, line_thickness, text_thickness, show_obstacles):
        """Draw one in-image annotation ``a`` onto ``img`` and return the image."""
        kind = a["type"]
        color = self._ANNOTATION_COLORS.get(kind, (0, 0, 0))

        if kind == "obstacle" and not show_obstacles:
            return img

        if kind in self._BOX_TYPES:
            # bounding boxes: two corners expanded to a four-point contour
            x_start = int(a["vector"][0][0])
            x_stop = int(a["vector"][1][0])
            y_start = int(a["vector"][0][1])
            y_stop = int(a["vector"][1][1])
            contours = np.array(
                [
                    [x_start, y_start],
                    [x_start, y_stop],
                    [x_stop, y_stop],
                    [x_stop, y_start],
                ],
                dtype=int,
            )
            cv2.drawContours(img, [contours], -1, color, line_thickness)
        elif kind in self._QUAD_TYPES:
            contours = np.array(
                [[int(a["vector"][k][0]), int(a["vector"][k][1])] for k in range(4)],
                dtype=int,
            )
            cv2.drawContours(img, [contours], -1, color, line_thickness)
        elif kind == "field edge":
            pts = np.array(list(a["vector"]), np.int32).reshape((-1, 1, 2))
            img = cv2.polylines(img, [pts], False, color, line_thickness)
        else:
            txt = self._INTERSECTION_TEXT.get(kind)
            if txt is None:
                self.fail(f"Unknown annotation type: {kind}")
            txt_size = cv2.getTextSize(txt, cv2.FONT_HERSHEY_COMPLEX, 1, text_thickness)
            cv2.putText(
                img,
                txt,
                (int(a["vector"][0][0] - (txt_size[0][0] / 2)), int(a["vector"][0][1] + (txt_size[0][1] / 2))),
                cv2.FONT_HERSHEY_SIMPLEX,
                1,
                (0, 0, 0),
                text_thickness,
            )
        return img

    @pytest.mark.skip(reason="Only run locally")
    def test_visualize_annotations(self):
        """Interactively browse dataset images with their annotations drawn on top.

        On the first run the YAML annotations are converted to a pickle cache
        and the method returns; later runs load the cache and open a viewer
        controlled by the keys printed at start-up.
        """
        # NOTE(review): the original comment read "Data downloaded from" followed
        # by a URL that is missing from this copy of the file.
        annotation_path = "/home/robosoccer/hdd/dataset/dataV2/TORSO-21/simulation/train/annotations.yaml"
        annotation_pickle = "/home/robosoccer/hdd/dataset/dataV2/TORSO-21/simulation/train/annotation.pkl"
        image_path = "/home/robosoccer//hdd/dataset/dataV2/TORSO-21/simulation/train/images"

        if not os.path.exists(annotation_pickle):
            with open(annotation_path) as f:
                print("Pickling annotation, will take a long time")
                # yaml.load() without a Loader raises TypeError on PyYAML >= 6.
                yaml_data = yaml.safe_load(f)
            with open(annotation_pickle, "wb") as f2:
                pickle.dump(yaml_data, f2)
            return

        MAX_DIMENSIONS = (1778, 1000)

        # SECURITY: pickle.load executes arbitrary code from the file. This is
        # only acceptable because the cache is written locally by the branch above.
        with open(annotation_pickle, "rb") as f:
            annos = pickle.load(f)["images"]

        print(
            "Press 's' and 'd' to move between images. 'D' and 'S' let you jump 100 images.\n'c' to correct a label\n'v' to save image.\n'q' closes.\n'n' toggles not in image text. 'o' to toggle showing obstacles\n'e' to toggle all annotations"
        )

        files = sorted(annos)

        not_in_image = True
        show_obstacles = True
        show_annotations = True
        i = 0
        # Bounding the loop avoids the IndexError the filter below could cause
        # by stepping past the last file.
        while 0 <= i < len(files):
            f = files[i]
            # Hard-coded filter: only files whose name contains "5733" are shown.
            if "5733" not in f:
                print(f)
                i += 1
                continue

            img_path = os.path.join(image_path, f)
            img = cv2.imread(img_path)
            self.assertIsNotNone(img, f"Could not read image {img_path}")
            h, w = img.shape[:2]
            text_thickness = int(w / 200)
            line_thickness = int(w / 200)
            y = 20

            # sort labels to have them in the correct order.
            image_annos_sorted = sorted(
                annos[f]["annotations"],
                key=lambda a: self._ANNOTATION_ORDER[a["type"]],
            )

            if show_annotations:
                for a in image_annos_sorted:
                    if not a["in_image"] and "vector" in a:
                        cv2.putText(
                            img,
                            f"{a['type']} completely concealed in image",
                            (0, y),
                            cv2.FONT_HERSHEY_SIMPLEX,
                            1,
                            (0, 0, 255),
                            int(text_thickness / 2),
                        )
                        y += 20
                    elif not a["in_image"]:
                        if not_in_image:
                            cv2.putText(
                                img,
                                f"{a['type']} not in image",
                                (0, y),
                                cv2.FONT_HERSHEY_SIMPLEX,
                                1,
                                (0, 0, 255),
                                int(text_thickness / 2),
                            )
                            y += 20
                    else:
                        img = self._draw_annotation(img, a, line_thickness, text_thickness, show_obstacles)

            if h > MAX_DIMENSIONS[1]:
                scaling = MAX_DIMENSIONS[1] / h
                img = cv2.resize(img, (int(w * scaling), int(h * scaling)))

            cv2.imshow("img", img)
            key = cv2.waitKey(0)
            if key == 100:  # d
                i += 1
            elif key == 68:  # D
                i += 100
            elif key == 115:  # s
                i -= 1
            elif key == 83:  # S
                i -= 100
            elif key in (27, 113):  # ESC or q
                # Returning (rather than exit(0)) keeps the test runner alive.
                cv2.destroyAllWindows()
                return
            elif key == 110:  # n
                not_in_image = not not_in_image
            elif key == 111:  # o
                show_obstacles = not show_obstacles
            elif key == 118:  # v
                cv2.imwrite(f"../viz_{f}", img)
            elif key == 99:  # c
                img_id = annos[f]["id"]
                # NOTE(review): the URL between "--new-tab" and the image id appears
                # to be missing from this copy; the command is kept verbatim.
                os.system(f"firefox --new-tab{img_id}/")
            elif key == 101:  # e
                show_annotations = not show_annotations

            # Clamp to valid indices; the upper bound is len(files) - 1.
            i = max(0, min(len(files) - 1, i))
            # Move the cursor up two lines so the status line overwrites itself.
            sys.stdout.write("\x1b[A")
            sys.stdout.write("\x1b[A")
            print(f"Current image number {i} name {f}\n")

        cv2.destroyAllWindows()