Commit
Add files via upload
UILXELA authored Dec 11, 2020
1 parent a661732 commit cf63a2c
Showing 100 changed files with 5,691 additions and 0 deletions.
242 changes: 242 additions & 0 deletions data_gen/bbox.py
@@ -0,0 +1,242 @@
import numpy as np

from datadescriptor import KittiDescriptor
from camera_utils import *
from constants import WINDOW_HEIGHT, WINDOW_WIDTH, MAX_RENDER_DEPTH_IN_METERS, MIN_VISIBLE_VERTICES_FOR_RENDER, VISIBLE_VERTEX_COLOR, OCCLUDED_VERTEX_COLOR, MIN_BBOX_AREA_IN_PX
from utils import degrees_to_radians
import logging
import sys
import glob
import os
from math import pi

try:
    sys.path.append(glob.glob('/home/alex/Documents/CARLA/PythonAPI/carla/dist/carla-*%d.%d-%s.egg' % (
        sys.version_info.major,
        sys.version_info.minor,
        'win-amd64' if os.name == 'nt' else 'linux-x86_64'))[0])
except IndexError:
    pass

import carla


VIEW_WIDTH = 1920//2
VIEW_HEIGHT = 1080//2
VIEW_FOV = 90

BB_COLOR = (248, 64, 24)

# ==============================================================================
# -- ClientSideBoundingBoxes ---------------------------------------------------
# ==============================================================================


def get_matrix(transform):
    """
    Creates a 4x4 world transform matrix from a carla.Transform
    (yaw/pitch/roll rotation plus translation).
    """
    rotation = transform.rotation
    location = transform.location
    c_y = np.cos(np.radians(rotation.yaw))
    s_y = np.sin(np.radians(rotation.yaw))
    c_r = np.cos(np.radians(rotation.roll))
    s_r = np.sin(np.radians(rotation.roll))
    c_p = np.cos(np.radians(rotation.pitch))
    s_p = np.sin(np.radians(rotation.pitch))
    matrix = np.matrix(np.identity(4))
    matrix[0, 3] = location.x
    matrix[1, 3] = location.y
    matrix[2, 3] = location.z
    matrix[0, 0] = c_p * c_y
    matrix[0, 1] = c_y * s_p * s_r - s_y * c_r
    matrix[0, 2] = -c_y * s_p * c_r - s_y * s_r
    matrix[1, 0] = s_y * c_p
    matrix[1, 1] = s_y * s_p * s_r + c_y * c_r
    matrix[1, 2] = -s_y * s_p * c_r + c_y * s_r
    matrix[2, 0] = s_p
    matrix[2, 1] = -c_p * s_r
    matrix[2, 2] = c_p * c_r
    return matrix
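
# Sanity-check sketch (not part of the original file; assumes the carla egg
# found on sys.path above). A zero transform should map to the 4x4 identity:
#
#   m = get_matrix(carla.Transform(carla.Location(0.0, 0.0, 0.0)))
#   assert np.allclose(m, np.identity(4))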


def transform_from_actor(npc):
    """ Returns (obj_type, agent_transform, bbox_transform, extent, location)
    for walker and vehicle actors, or five Nones for any other actor type. """
    if "walker" in npc.type_id:
        obj_type = 'Pedestrian'
    elif "vehicle" in npc.type_id:
        obj_type = 'Car'
    else:
        return (None, None, None, None, None)
    agent_transform = npc.get_transform()
    bbox_transform = carla.Transform(npc.bounding_box.location)
    ext = npc.bounding_box.extent
    location = agent_transform.location
    return obj_type, agent_transform, bbox_transform, ext, location
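
# Example (hedged; type_id strings are illustrative): an actor with type_id
# 'vehicle.tesla.model3' maps to 'Car', 'walker.pedestrian.0001' maps to
# 'Pedestrian', and anything else yields five Nones, which
# create_kitti_datapoint below treats as "skip this actor".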



def transform_points(points, txm_mat):
    """
    Given a 4x4 transformation matrix, transform an array of 3D points.
    Expected point format: [[X0,Y0,Z0],..[Xn,Yn,Zn]]
    """
    # Needed format: [[X0,..Xn],[Y0,..Yn],[Z0,..Zn]]. So let's transpose
    # the point matrix.
    points = points.transpose()
    # Add a row of 1s (homogeneous coordinate): [[X0..,Xn],[Y0..,Yn],[Z0..,Zn],[1,..1]]
    points = np.append(points, np.ones((1, points.shape[1])), axis=0)
    # Point transformation
    points = txm_mat * points
    # Return all but the last (homogeneous) row
    return points[0:3].transpose()
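
# Worked example (pure NumPy, no CARLA needed; illustrative only):
# translating the origin by (1, 2, 3) with a homogeneous matrix.
#
#   t = np.matrix(np.identity(4))
#   t[0, 3], t[1, 3], t[2, 3] = 1.0, 2.0, 3.0
#   transform_points(np.array([[0.0, 0.0, 0.0]]), t)  # -> matrix([[1., 2., 3.]])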



def vertices_from_extension(ext):
    """ Extracts the 8 bounding box vertices relative to (0,0,0)
    https://github.com/carla-simulator/carla/commits/master/Docs/img/vehicle_bounding_box.png
    """
    return np.array([
        [ext.x, ext.y, ext.z],        # Top left front
        [- ext.x, ext.y, ext.z],      # Top left back
        [ext.x, - ext.y, ext.z],      # Top right front
        [- ext.x, - ext.y, ext.z],    # Top right back
        [ext.x, ext.y, - ext.z],      # Bottom left front
        [- ext.x, ext.y, - ext.z],    # Bottom left back
        [ext.x, - ext.y, - ext.z],    # Bottom right front
        [- ext.x, - ext.y, - ext.z]   # Bottom right back
    ])
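
# Example (hedged; numbers are illustrative): a CARLA bounding-box extent is a
# half-size, so an extent of (2.0, 1.0, 0.75) describes a 4 m x 2 m x 1.5 m box
# and this helper returns its 8 corners at (+-2.0, +-1.0, +-0.75) around the
# local origin.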

def bbox_2d_from_agent(agent, intrinsic_mat, extrinsic_mat, ext, bbox_transform, agent_transform):
    """ Creates bounding boxes for a given agent and camera/world calibration matrices.
    Returns the 2d pixel coordinates (with depth) of the agent's bounding box vertices. """
    bbox = vertices_from_extension(ext)
    # Transform the vertices with respect to the bounding box transform
    bbox = transform_points(bbox, get_matrix(bbox_transform))
    # The bounding box transform is given with respect to the agent's transform,
    # so transform the points relative to that as well
    bbox = transform_points(bbox, get_matrix(agent_transform))
    # The agent's transform is relative to the world, so bbox now contains
    # the 3D bounding box vertices in world coordinates.
    # (logging.info these vertices to check that the chain is working.)
    # Store each vertex's 2d point for drawing bounding boxes later
    vertices_pos2d = vertices_to_2d_coords(bbox, intrinsic_mat, extrinsic_mat)
    return vertices_pos2d



def vertex_to_world_vector(vertex):
    """ Returns the coordinates of the vector in correct carla world format (X,Y,Z,1) """
    return np.array([
        [vertex[0, 0]],  # [[X,
        [vertex[0, 1]],  #   Y,
        [vertex[0, 2]],  #   Z,
        [1.0]            #   1.0]]
    ])

def vertices_to_2d_coords(bbox, intrinsic_mat, extrinsic_mat):
    """ Accepts a bbox which is a list of 3d world coordinates and returns a list
    of the 2d pixel coordinates of each vertex.
    Each vertex is represented as a tuple (y, x, d) where y and x are the 2d pixel
    coordinates and d is the depth. The depth can be used to filter visible vertices.
    """
    vertices_pos2d = []
    for vertex in bbox:
        pos_vector = vertex_to_world_vector(vertex)
        # Camera coordinates
        transformed_3d_pos = proj_to_camera(pos_vector, extrinsic_mat)
        # 2d pixel coordinates
        pos2d = proj_to_2d(transformed_3d_pos, intrinsic_mat)
        # The actual rendered depth (may be wall or other object instead of vertex)
        vertex_depth = pos2d[2]
        x_2d, y_2d = WINDOW_WIDTH - pos2d[0], WINDOW_HEIGHT - pos2d[1]
        vertices_pos2d.append((y_2d, x_2d, vertex_depth))
    return vertices_pos2d
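
# Shape sketch (assumed numbers for illustration; actual WINDOW_WIDTH and
# WINDOW_HEIGHT come from constants.py): with a 1920x1080 window, a vertex
# projecting to pixel (x=800, y=500) at 25 m depth is stored as
# (1080 - 500, 1920 - 800, 25.0) = (580, 1120, 25.0),
# i.e. (y, x, depth) in the flipped window coordinates used below.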

def calculate_occlusion_stats(image, vertices_pos2d, depth_map, draw_vertices=True):
    """ Draws each vertex in vertices_pos2d if it is in front of the camera.
    The color is based on whether the vertex is occluded or not.
    Returns the number of visible vertices and the number of vertices outside the camera.
    """
    num_visible_vertices = 0
    num_vertices_outside_camera = 0
    for y_2d, x_2d, vertex_depth in vertices_pos2d:
        # If the point is in front of the camera but not too far away
        if MAX_RENDER_DEPTH_IN_METERS > vertex_depth > 0 and point_in_canvas((y_2d, x_2d)):
            is_occluded = point_is_occluded(
                (y_2d, x_2d), vertex_depth, depth_map)
            if is_occluded:
                vertex_color = OCCLUDED_VERTEX_COLOR
            else:
                num_visible_vertices += 1
                vertex_color = VISIBLE_VERTEX_COLOR
            if draw_vertices:
                draw_rect(image, (y_2d, x_2d), 4, vertex_color)
        else:
            num_vertices_outside_camera += 1
    return num_visible_vertices, num_vertices_outside_camera

def get_relative_rotation_y(agent, player):
    """ Returns the relative rotation of the agent to the camera in yaw.
    The relative rotation is the difference between the camera rotation (on the car)
    and the agent rotation. """
    # We only care about the rotation for the classes we do detection on
    if agent.get_transform():
        rot_agent = agent.get_transform().rotation.yaw
        rot_car = player.get_transform().rotation.yaw
        return degrees_to_radians(rot_agent - rot_car)
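
# Example (hedged): an agent heading 90 degrees off the camera car's yaw gives
# degrees_to_radians(90) = pi/2 ~= 1.5708; create_kitti_datapoint below folds
# this with % pi before writing it as the KITTI rotation_y field.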


def create_kitti_datapoint(agent, intrinsic_mat, extrinsic_mat, image, depth_image, player_measurements, draw_3D_bbox=True):
    """ Calculates the bounding box of the given agent, and returns a KittiDescriptor
    which describes the object to be labeled """
    obj_type, agent_transform, bbox_transform, ext, location = transform_from_actor(
        agent)

    if obj_type is None:
        logging.warning(
            "Could not get bounding box for agent. Object type is None")
        return image, None

    vertices_pos2d = bbox_2d_from_agent(
        agent, intrinsic_mat, extrinsic_mat, ext, bbox_transform, agent_transform)
    depth_map = depth_to_array(depth_image)
    num_visible_vertices, num_vertices_outside_camera = calculate_occlusion_stats(
        image, vertices_pos2d, depth_map, draw_vertices=draw_3D_bbox)
    midpoint = midpoint_from_agent_location(
        image, location, extrinsic_mat, intrinsic_mat)

    # At least N vertices have to be visible in order to draw the bbox
    if num_visible_vertices >= MIN_VISIBLE_VERTICES_FOR_RENDER and num_vertices_outside_camera < MIN_VISIBLE_VERTICES_FOR_RENDER:
        bbox_2d = calc_projected_2d_bbox(vertices_pos2d)
        area = calc_bbox2d_area(bbox_2d)
        if area < MIN_BBOX_AREA_IN_PX:
            logging.info("Filtered out bbox with too low area {}".format(area))
            return image, None
        if draw_3D_bbox:
            draw_3d_bounding_box(image, vertices_pos2d)
        rotation_y = get_relative_rotation_y(agent, player_measurements) % pi

        datapoint = KittiDescriptor()
        datapoint.set_bbox(bbox_2d)
        datapoint.set_3d_object_dimensions(ext)
        datapoint.set_type(obj_type)
        datapoint.set_3d_object_location(midpoint)
        datapoint.set_rotation_y(rotation_y)
        return image, datapoint
    else:
        return image, None
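
# End-to-end sketch (hedged; `camera_intrinsic`, `camera_extrinsic`, `image`,
# `depth_image`, and `player` are assumptions about the caller's capture loop,
# not names defined in this file):
#
#   for agent in world.get_actors():
#       image, datapoint = create_kitti_datapoint(
#           agent, camera_intrinsic, camera_extrinsic,
#           image, depth_image, player)
#       if datapoint is not None:
#           print(datapoint)  # one KITTI label line per visible agent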

