driverless-2019/video.py at master · Unicamp-E-Racing/driverless-2019 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
from time import time
import numpy as np
import cv2
import math
from pydarknet import Detector, Image
from constants import *
if CAPTURE_MODE == "ZED_SDK":
    import pyzed.sl as sl
    zed = sl.Camera()
    init_params = sl.InitParameters()
    init_params.camera_resolution = sl.RESOLUTION.HD720
    init_params.depth_mode = sl.DEPTH_MODE.PERFORMANCE
    init_params.coordinate_units = sl.UNIT.METER
    err = zed.open(init_params)
    if err != sl.ERROR_CODE.SUCCESS:
        print("ERROR OPENING ZED CAMERA WITH SDK")
        exit(1)
    image = sl.Mat()
    depth_map = sl.Mat()
    point_cloud = sl.Mat()
    runtime_parameters = sl.RuntimeParameters()
elif CAPTURE_MODE == "OPENCV":
    cam = cv2.VideoCapture(CAMERA_INDEX)
    cam.set(cv2.CAP_PROP_FRAME_WIDTH, OPENCV_CAMERA_WIDTH)
    cam.set(cv2.CAP_PROP_FRAME_HEIGHT, OPENCV_CAMERA_HEIGHT)

if DETECTION_MODE == "YOLO":
    net = Detector(bytes(YOLO_PATH_CONFIG[YOLO_VERSION], encoding="utf-8"), bytes(YOLO_PATH_WEIGHTS[YOLO_VERSION], encoding="utf-8"), 0, bytes(YOLO_PATH_DATA[YOLO_VERSION],encoding="utf-8"))


def get_frame():
    if CAPTURE_MODE == "ZED_SDK":
        if zed.grab(runtime_parameters) == sl.ERROR_CODE.SUCCESS:
            # A new image is available if grab() returns SUCCESS
            zed.retrieve_image(image, sl.VIEW.LEFT)
        return cv2.cvtColor(image.get_data(), cv2.COLOR_RGBA2RGB)
    else:
        _, frame = cam.read()
        if FLIP_IMG:
            frame = cv2.flip(frame, 0)
            frame = cv2.flip(frame, 1)
        return frame[:,:OPENCV_FRAME_WIDTH_CUT,:] # cut half left of image

def detect(frame):
    img_darknet = Image(frame)
    results = net.detect(img_darknet, thresh=DETECTION_THRESHOLD)
    return [[x,y,w,h,cat,score] for cat, score, (x, y, w, h) in results]

def get_mono_pos(rects):
    cones_blue = [[],[]]
    cones_yellow = [[],[]]
    print_info = ""
    for rect in rects:
        y = (CONE_HEIGHT * FOCAL) / (rect[3]*PIXEL_SIZE)
        u = (rect[0]-U_OFFSET)
        x = u*PIXEL_SIZE*y/FOCAL
        v = (rect[1]-V_OFFSET)
        z = v*PIXEL_SIZE*y/FOCAL
        print_info += f"Cone height:{rect[3]} px \n"
        print_info += f"Cone x:{x/10} cm, y:{y/10} cm \n"

        x /= 1000
        x += X_OFFSET
        y /= 1000
        z /= 1000

        ratio = rect[2]/rect[3]

        if MIN_RATIO <= ratio <= MAX_RATIO:
            if MIN_DISTANCE <= y <= MAX_DISTANCE:
                if not math.isinf(x) or not math.isinf(y) or not math.isnan(x) or not math.isnan(y):
                    if rect[4] == b'blue_cone':
                        cones_blue[0].append([x,y])
                        cones_blue[1].append(rect)
                    elif rect[4] == b'yellow_cone':
                        cones_yellow[0].append([x,y])
                        cones_yellow[1].append(rect)
            else:
                ignored_by_y_dist += 1
        else:
            ignored_by_ratio += 1

    print_info += f"Input:\n    Cones Detected:{len(rects):>3}\n"
    print_info += f"    Cones Returned:\n        Blue:{len(cones_blue):>5}\n        Yellow:{len(cones_yellow):>3}\n"
    print_info += f"    Ignored cones:\n        Ratio:{ignored_by_ratio:>4}\n        Y Dist:{ignored_by_y_dist:>3}\n"

    return cones_blue, cones_yellow, print_info

def get_stereo_pos(rects):
    cones_blue = [[],[]]
    cones_yellow = [[],[]]
    print_info = ""
    for rect in rects:
        zed.retrieve_measure(point_cloud, sl.MEASURE.XYZRGBA)
        #zed.retrieve_measure(depth_map, sl.MEASURE.DEPTH) # Retrieve depth
        err, point3D = point_cloud.get_value(rect[0],rect[1])
        if err == sl.ERROR_CODE.SUCCESS:
            x = point3D[0]
            z = point3D[1]
            y = point3D[2]
            if not math.isinf(x) and not math.isinf(y) and not math.isnan(x) and not math.isnan(y):
                if rect[4] == b'blue_cone' or rect[4] == b'BLUE_CONE':
                    cones_blue[0].append([y,-x + X_OFFSET ])
                    cones_blue[1].append(rect)
                elif rect[4] == b'yellow_cone' or rect[4] == b'YELLOW_CONE':
                    cones_yellow[0].append([y,-x + X_OFFSET])
                    cones_yellow[1].append(rect)

    return cones_blue, cones_yellow, print_info

def get_pos(rects):
    if MESURMENT_MODE == "MONO":
        cones_blue, cones_yellow, print_info = get_mono_pos(rects)
    elif MESURMENT_MODE == "STEREO":
        cones_blue, cones_yellow, print_info = get_stereo_pos(rects)


    return cones_blue, cones_yellow, print_info


def run():
    frame_time_start = time()
    frame = get_frame()
    frame_time = (time() - frame_time_start) * 1000

    detect_time_start = time()
    rects = detect(frame)
    detect_time = (time() - detect_time_start) * 1000

    img = frame.copy()

    frame_time_start = time()
    cones_blue, cones_yellow, print_info = get_pos(rects)
    get_pos_time = (time() - frame_time_start) * 1000

    if SHOW_IMG:
        if len(cones_blue[0]):
            for i in range(len(cones_blue[0])):
                x,y = cones_blue[0][i]
                u,v,w,h,cat,_ = cones_blue[1][i]
                cv2.rectangle(img, (int(u - w / 2), int(v - h / 2)), (int(u + w / 2), int(v + h / 2)), (255, 0, 0), thickness=2)
                cv2.putText(img, str(f"x:{x:.2f} m"),(int(u),int(v)),cv2.FONT_HERSHEY_COMPLEX,1,(255,255,0))
                cv2.putText(img, str(f"y:{y:.2f} m"),(int(u),int(v+30)),cv2.FONT_HERSHEY_COMPLEX,1,(255,255,0))

        if len(cones_yellow[0]):
            for i in range(len(cones_yellow[0])):
                x,y = cones_yellow[0][i]
                u,v,w,h,cat,_ = cones_yellow[1][i]
                cv2.rectangle(img, (int(u - w / 2), int(v - h / 2)), (int(u + w / 2), int(v + h / 2)), (0, 255, 255), thickness=2)
                cv2.putText(img, str(f"x:{x:.2f} m"),(int(u),int(v)),cv2.FONT_HERSHEY_COMPLEX,1,(255,255,0))
                cv2.putText(img, str(f"y:{y:.2f} m"),(int(u),int(v+30)),cv2.FONT_HERSHEY_COMPLEX,1,(255,255,0))


    print_info += f"    Times:\n        Frame:{frame_time:>7.0f} ms\n        Detect:{detect_time:>6.0f} ms\n        get_pos:{get_pos_time:>5.0f} ms\n\n"

    return np.array(cones_blue[0]), np.array(cones_yellow[0]), print_info, img


if __name__ == "__main__":
    print("Starting test")

    blue, yellow , print_info, img = run()

    print(f"blue cones: {blue}\nyellow cones: {yellow}\n")