berkeleyauv · nLevin13 · Jan 18, 2021 · Nov 9, 2020 · Nov 23, 2020 · Dec 5, 2020
diff --git a/.gitattributes b/.gitattributes
@@ -0,0 +1 @@
+*.zip filter=lfs diff=lfs merge=lfs -text
diff --git a/.gitignore b/.gitignore
@@ -18,3 +18,5 @@ __pycache__/
 # IDE files
 .idea
 .vs_code/
+
+data/
diff --git a/perception/__init__.py b/perception/__init__.py
@@ -1,8 +1,14 @@
-import perception.tasks.TestTasks.TestAlgo as TestAlgo
-import perception.tasks.gate.GateCenter as GateSeg
+import perception.vis.TestAlgo as TestAlgo
+import perception.tasks.gate.GateCenterAlgo as GateSeg
+import perception.tasks.gate.GateSegmentationAlgoA as GateSegA
+import perception.tasks.gate.GateSegmentationAlgoB as GateSegB
+import perception.tasks.gate.GateSegmentationAlgoC as GateSegC
 # import perception.tasks as tasks
 
 ALGOS = {
     'test': TestAlgo.TestAlgo,
-    'gateseg': GateSeg.GateCenter
+    'gateseg': GateSeg.GateCenterAlgo,
+    'gatesegA': GateSegA.GateSegmentationAlgoA,
+    'gatesegB': GateSegB.GateSegmentationAlgoB,
+    'gatesegC': GateSegC.GateSegmentationAlgoC
 }
diff --git a/perception/tasks/TaskPerceiver.py b/perception/tasks/TaskPerceiver.py
@@ -1,8 +1,8 @@
-from typing import Any, Dict, Tuple
+from typing import Any, Dict
 import numpy as np
 
-class TaskPerceiver:
 
+class TaskPerceiver:
     def __init__(self, **kwargs):
         """Initializes the TaskPerceiver.
         Args:
@@ -11,22 +11,18 @@ def __init__(self, **kwargs):
                 for the slider which controls this variable, and default_val is
                 the initial value of the slider.
         """
-        self.time = 0
         self.kwargs = kwargs
 
     def analyze(self, frame: np.ndarray, debug: bool, slider_vals: Dict[str, int]) -> Any:
         """Runs the algorithm and returns the result.
         Args:
-			frame: The frame to analyze
+            frame: The frame to analyze
             debug: Whether or not to display intermediate images for debugging
             slider_vals: A list of names of the variables which the user should be
                 able to control from the Visualizer, mapped to current slider
                 value for that variable
-		Returns:
-			the result of the algorithm
-			debug frames must each be same size as original input frame. Might change this in the future.
+        Returns:
+            the result of the algorithm
+            debug frames must each be same size as original input frame. Might change this in the future.
         """
         raise NotImplementedError("Need to implement with child class.")
-
-    def var_info(self) -> Dict[str, Tuple[Tuple[int, int], int]]:
-        return self.kwargs
diff --git a/perception/tasks/cross/CrossPerceiver.py b/perception/tasks/cross/CrossPerceiver.py
diff --git a/perception/tasks/TestTasks/__init__.py → perception/tasks/cross/__init__.py b/perception/tasks/TestTasks/__init__.py → perception/tasks/cross/__init__.py
diff --git a/perception/tasks/cross/cross_detection.py b/perception/tasks/cross/cross_detection.py
@@ -8,10 +8,10 @@
 #############################################################################
 
 sys.path.insert(0, '../background_removal')
-from peak_removal_adaptive_thresholding import filter_out_highest_peak_multidim
-from combined_filter import combined_filter
+from perception.tasks.segmentation.peak_removal_adaptive_thresholding import filter_out_highest_peak_multidim
+from perception.tasks.segmentation.combinedFilter import init_combined_filter
 
-ret, frame = True, cv2.imread('../data/cross/cross.png') # https://i.imgur.com/rjv1Vcy.png
+ret, frame = True, cv2.imread('../data/cross/cross.png')  # https://i.imgur.com/rjv1Vcy.png
 
 # "hsv" = Apply hsv thresholding before trying to find the path marker
 # "multidim" = Apply filter_out_highest_peak_multidim
@@ -29,7 +29,7 @@ def find_cross(frame, draw_figs=True):
     gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
 
     ret, thresh = cv2.threshold(gray, 127, 255,0)
-    __, contours,hierarchy = cv2.findContours(thresh,cv2.RETR_TREE,cv2.CHAIN_APPROX_SIMPLE)
+    __, contours,hierarchy = cv2.findContours(thresh, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
     contours.sort(key=lambda c: cv2.contourArea(c), reverse=True)
 
     possible_crosses = []
@@ -44,17 +44,16 @@ def find_cross(frame, draw_figs=True):
         if defects is not None and len(defects) == 4:
             possible_crosses.append(defects)
 
-
     if draw_figs:
         img = frame.copy()
         for defects in possible_crosses:
             for i in range(defects.shape[0]):
-                s,e,f,d = defects[i,0]
+                s, e, f, d = defects[i, 0]
                 # start = tuple(cnt[s][0])
                 # end = tuple(cnt[e][0])
                 far = tuple(cnt[f][0])
                 # cv2.line(img,start,end,[0,255,0],2)
-                cv2.circle(img,far,5,[0,0,255],-1)
+                cv2.circle(img, far, 5, [0, 0, 255], -1)
             cv2.imshow('cross at contour number ' + str(i),img)
         cv2.imshow('original', frame)
 
@@ -64,15 +63,15 @@ def find_cross(frame, draw_figs=True):
 ###########################################
 # Main Body
 ###########################################
-
+# TODO: port to vis
 if __name__ == "__main__":
+    combined_filter = init_combined_filter()
+
     ret_tries = 0
-    while(1 and ret_tries < 50):
+    while 1 and ret_tries < 50:
         # ret,frame = cap.read()
-
-        if ret == True:
+        if ret:
             # frame = cv2.resize(frame, (0,0), fx=0.5, fy=0.5)
-
             if thresholding == "multidim":
                 votes1, threshed = filter_out_highest_peak_multidim(frame)
                 threshed = cv2.morphologyEx(threshed, cv2.MORPH_OPEN, np.ones((5,5),np.uint8))
@@ -86,13 +85,9 @@ def find_cross(frame, draw_figs=True):
 
             ret_tries = 0
             k = cv2.waitKey(60) & 0xff
-            if k == 27: # esc
-                if testing:
-                    print("hsv thresholds:")
-                    print(thresholds_used)
+            if k == 27:  # esc
                 break
         else:
             ret_tries += 1
 
     cv2.destroyAllWindows()
-    cap.release()
diff --git a/perception/tasks/gate/GateCenter.py → perception/tasks/gate/GateCenterAlgo.py b/perception/tasks/gate/GateCenter.py → perception/tasks/gate/GateCenterAlgo.py
@@ -1,16 +1,14 @@
-from perception.tasks.gate.GateSegmentation import GateSegmentationAlgo
+from perception.tasks.gate.GateSegmentationAlgoA import GateSegmentationAlgoA
 from perception.tasks.TaskPerceiver import TaskPerceiver
 from collections import namedtuple
-import sys
 
 import numpy as np
 import math
 import cv2 as cv
-import time
 import statistics
 
 
-class GateCenter(TaskPerceiver):
+class GateCenterAlgo(TaskPerceiver):
     center_x_locs, center_y_locs = [], []
     output_class = namedtuple("GateOutput", ["centerx", "centery"])
     output_type = {'centerx': np.int16, 'centery': np.int16}
@@ -20,39 +18,43 @@ def __init__(self):
         self.gate_center = self.output_class(250, 250)
         self.use_optical_flow = False
         self.optical_flow_c = 0.1
-        self.gate = GateSegmentationAlgo()
+        self.gate = GateSegmentationAlgoA()
         self.prvs = None
 
+    # TODO: do input and return typing
     def analyze(self, frame, debug, slider_vals):
-        self.optical_flow_c = slider_vals['optical_flow_c'] / 100
-        rect1, rect2, debug_filter = self.gate.analyze(frame, True)
+        self.optical_flow_c = slider_vals['optical_flow_c']/100
+        rect, debug_filters = self.gate.analyze(frame, True)
+        debug_filter = debug_filters[-1]
+        debug_filters = debug_filters[:-1]
+
         if self.prvs is None:
             # frame = cv.resize(frame, None, fx=0.3, fy=0.3)
             self.prvs = cv.cvtColor(frame, cv.COLOR_BGR2GRAY)
-        else:
-            if rect1 and rect2:
-                self.gate_center = self.get_center(rect1, rect2, frame)
+        else: 
+            if rect[0] and rect[1]:
+                self.gate_center = self.get_center(rect[0], rect[1], frame)
                 if self.use_optical_flow:
-                    cv.circle(debug_filter, self.gate_center, 5, (3, 186, 252), -1)
+                    cv.circle(debug_filter, self.gate_center, 5, (3,186,252), -1)
                 else:
-                    cv.circle(debug_filter, self.gate_center, 5, (0, 0, 255), -1)
-
+                    cv.circle(debug_filter, self.gate_center, 5, (0,0,255), -1)
+        
         if debug:
-            return (self.output_class(self.gate_center[0], self.gate_center[1]), [frame, debug_filter])
-        return self.output_class(self.gate_center[0], self.gate_center[1])
+            return (self.gate_center[0], self.gate_center[1]), list(debug_filters) + [debug_filter]
+        return (self.gate_center[0], self.gate_center[1])
 
     def center_without_optical_flow(self, center_x, center_y):
         # get starting center location, averaging over the first 2510 frames
         if len(self.center_x_locs) == 0:
             self.center_x_locs.append(center_x)
             self.center_y_locs.append(center_y)
-
+            
         elif len(self.center_x_locs) < 25:
             self.center_x_locs.append(center_x)
             self.center_y_locs.append(center_y)
             center_x = int(statistics.mean(self.center_x_locs))
             center_y = int(statistics.mean(self.center_y_locs))
-
+        
         # use new center location only when it is close to the previous valid location
         else:
             self.center_x_locs.append(center_x)
@@ -61,11 +63,11 @@ def center_without_optical_flow(self, center_x, center_y):
             self.center_y_locs.pop(0)
             x_temp_avg = int(statistics.mean(self.center_x_locs))
             y_temp_avg = int(statistics.mean(self.center_y_locs))
-            if math.sqrt((center_x - x_temp_avg) ** 2 + (center_y - y_temp_avg) ** 2) > 10:
+            if math.sqrt((center_x - x_temp_avg)**2 + (center_y - y_temp_avg)**2) > 10:
                 center_x, center_y = int(x_temp_avg), int(y_temp_avg)
-
+                
         return (center_x, center_y)
-
+    
     def dense_optical_flow(self, frame):
         next_frame = cv.cvtColor(frame, cv.COLOR_BGR2GRAY)
         flow = cv.calcOpticalFlowFarneback(self.prvs, next_frame, None, 0.5, 3, 15, 3, 5, 1.2, 0)
@@ -82,53 +84,16 @@ def get_center(self, rect1, rect2, frame):
         x2, y2, w2, h2 = rect2
         center_x, center_y = (x1 + x2) // 2, ((y1 + h1 // 2) + (y2 + h2 // 2)) // 2
         self.prvs, mag, ang = self.dense_optical_flow(frame)
-        # print(np.mean(mag))
-        if len(self.center_x_locs) < 25 or (np.mean(mag) < 40 and ((not self.use_optical_flow) or \
-                                                                   (self.use_optical_flow and (
-                                                                           center_x - self.gate_center[0]) ** 2 + (
-                                                                            center_y - self.gate_center[
-                                                                        1]) ** 2 < 50))):
+
+        if len(self.center_x_locs) < 25 or (np.mean(mag) < 40 and ((not self.use_optical_flow ) or \
+            (self.use_optical_flow and (center_x - self.gate_center[0])**2 + (center_y - self.gate_center[1])**2 < 50))):
             self.use_optical_flow = False
             return self.center_without_optical_flow(center_x, center_y)
         self.use_optical_flow = True
         return (int(self.gate_center[0] + self.optical_flow_c * np.mean(mag * np.cos(ang))), \
                 (int(self.gate_center[1] + self.optical_flow_c * np.mean(mag * np.sin(ang)))))
 
 
-# this part is temporary and will be covered by other files in the future
 if __name__ == '__main__':
-    cap = cv.VideoCapture(sys.argv[1])
-    ret_tries = 0
-    start_time = time.time()
-    frame_count = 0
-    paused = False
-    speed = 1
-    ret, frame1 = cap.read()
-    frame1 = cv.resize(frame1, None, fx=0.3, fy=0.3)
-    prvs = cv.cvtColor(frame1, cv.COLOR_BGR2GRAY)
-    hsv = np.zeros_like(frame1)
-    hsv[..., 1] = 255
-    gate_center = GateCenter()
-    while ret_tries < 50:
-        for _ in range(speed):
-            ret, frame = cap.read()
-        if frame_count == 1000:
-            break
-        if ret:
-            frame = cv.resize(frame, None, fx=0.3, fy=0.3)
-            center, filtered_frame = gate_center.analyze(frame, True)
-            cv.imshow('original', frame)
-            cv.imshow('filtered_frame', filtered_frame)
-            ret_tries = 0
-            key = cv.waitKey(30)
-            if key == ord('q') or key == 27:
-                break
-            if key == ord('p'):
-                paused = not paused
-            if key == ord('i') and speed > 1:
-                speed -= 1
-            if key == ord('o'):
-                speed += 1
-        else:
-            ret_tries += 1
-        frame_count += 1
+    from perception.vis.vis import run
+    run(['..\..\..\data\GOPR1142.MP4'], GateCenterAlgo(), False)
-Original file line number
+Diff line change
@@ Expand Up / @@ -18,3 +18,5 @@ __pycache__/ @@
     # IDE files
     .idea
     .vs_code/
+    data/