Skip to content

Commit b444697

Browse files
committed
meanshift, camshift & optical flow
1 parent cd7d6cc commit b444697

File tree

7 files changed

+335
-4
lines changed

7 files changed

+335
-4
lines changed

.gitignore

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1-
1+
resources
22
recordings
33
.idea

README.md

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
# OpenCV2 Object Tracking
2+
3+
## Meanshift Algorithm
4+
5+
[OpenCV Meanshift Algorithm for Object Tracking](https://mpolinowski.github.io/devnotes/2021-12-08--opencv-meanshift-tracking)
6+
7+
## CAMshift Algorithm
8+
9+
[OpenCV CAMshift Algorithm for Object Tracking](https://mpolinowski.github.io/devnotes/2021-12-09--opencv-camshift-tracking)
10+
11+
## Optical Flow Algorithm (Sparse & Dense)
12+
13+
[OpenCV Optical Flow Algorithm for Object Tracking](https://mpolinowski.github.io/devnotes/2021-12-10--opencv-optical-flow-tracking)

scripts/camshift_tracking.py

Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
1+
# Usage
# python scripts/camshift_tracking.py -u 'rtsp://admin:instar@192.168.2.19/livestream/13'
#
# Track an interactively selected region of interest (ROI) in an RTSP
# stream using the CAMshift algorithm on a hue histogram back-projection.
import numpy as np
import cv2
import argparse
from imutils.video import VideoStream
import time

# Parse the arguments
ap = argparse.ArgumentParser()
ap.add_argument("-u", "--url", help="RTSP streaming URL", default="rtsp://admin:instar@192.168.2.19/livestream/13")
args = vars(ap.parse_args())

# get video stream from IP camera
print("[INFO] starting video stream")
vs = VideoStream(args["url"]).start()

# first frame from stream
frame = vs.read()
# select region of interest (interactive window; press ENTER/SPACE to confirm)
bbox = cv2.selectROI(frame)
x, y, w, h = bbox
track_window = (x, y, w, h)
# define area of bounding box as area of interest
roi = frame[y:y+h, x:x+w]
# convert ROI to HSV colour space
hsv_roi = cv2.cvtColor(roi, cv2.COLOR_BGR2HSV)
# histogram over the hue channel ([0]) of the ROI, hue range 0-180
# https://docs.opencv.org/4.x/d1/db7/tutorial_py_histogram_begins.html
roi_hist = cv2.calcHist([hsv_roi], [0], None, [180], [0, 180])
# normalize histogram values into the 0-255 range for back-projection
roi_hist = cv2.normalize(roi_hist, roi_hist, 0, 255, cv2.NORM_MINMAX)
# set up the termination criteria, either 10 iterations or move by at least 1 pt
parameter = (cv2.TERM_CRITERIA_EPS | cv2.TERM_CRITERIA_COUNT, 10, 1)

# now loop through the rest of avail frames
# and use camshift to track the defined roi
while True:
    # get next frame
    frame = vs.read()
    # BUG FIX: was `if True:` — guard against a dropped/None frame instead
    if frame is not None:
        # convert to hsv
        hsv = cv2.cvtColor(frame, cv2.COLOR_BGR2HSV)
        # back-project the hue histogram onto the current frame
        # https://docs.opencv.org/3.4.15/da/d7f/tutorial_back_projection.html
        dst = cv2.calcBackProject([hsv], [0], roi_hist, [0, 180], 1)
        # BUG FIX: feed the *updated* track_window back into CamShift so the
        # search window follows the object; the original passed the initial
        # (x, y, w, h) every iteration, so the window never moved.
        # BUG FIX: the first return value is a rotated rect ((cx, cy), (w, h),
        # angle), not a success flag — `if not ok:` could never fire because a
        # non-empty tuple is always truthy.
        rot_rect, track_window = cv2.CamShift(dst, track_window, parameter)
        # a collapsed window means the back-projection found no match
        if track_window[2] == 0 or track_window[3] == 0:
            print('[WARNING] track lost')
        # take the updated rotated rectangle corner points
        pts = cv2.boxPoints(rot_rect)
        pts = np.int0(pts)
        # use corner points to draw the rotated bounding polygon
        output = cv2.polylines(frame, [pts], True, 255, 5)
        # display track
        cv2.imshow("CAMshift Track", output)
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
    else:
        break


cv2.destroyAllWindows()

scripts/meanshift_tracking.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# Usage
22
# python scripts/meanshift_tracking.py -u 'rtsp://admin:instar@192.168.2.19/livestream/13'
33
import cv2
4-
from matplotlib import pyplot as plt
4+
# from matplotlib import pyplot as plt
55
import argparse
66
# from imutils import resize
77
from imutils.video import VideoStream
@@ -65,7 +65,7 @@
6565
print('[WARNING] track lost')
6666
# now update the roi coordinates to new values
6767
x, y, w, h = track_window
68-
cv2.rectangle(frame, (x, y), (x+w, y+h), (0, 255, 255), 5)
68+
cv2.rectangle(frame, (x, y), (x+w, y+h), (0, 255, 255), 2)
6969
# display track
7070
cv2.imshow("Meanshift Track", frame)
7171
if cv2.waitKey(1) & 0xFF == ord('q'):
@@ -74,4 +74,4 @@
7474
break
7575

7676

77-
cv2.destroyAllWindows()
77+
cv2.destroyAllWindows()

scripts/optical_flow_dense.py

Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
1+
# Usage
# python scripts/optical_flow_dense.py -p 'resources/car_race_01.mp4'
#
# Visualize dense (Farneback) optical flow: flow direction is mapped to hue,
# flow magnitude to brightness, and the result is shown and recorded.
import datetime
import sys

import cv2
import argparse
import numpy as np

# Parse the arguments
ap = argparse.ArgumentParser()
ap.add_argument("-p", "--path", help="Path to video file", default="resources/car_race_02.mp4")
args = vars(ap.parse_args())

cap = cv2.VideoCapture(args["path"])
if not cap.isOpened():
    print("[ERROR] opening video file")
    sys.exit()

# Optional recording parameter
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = int(cap.get(cv2.CAP_PROP_FPS))
video_codec = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
prefix = 'recordings/'+datetime.datetime.now().strftime("%y%m%d_%H%M%S")
basename = "object_track.mp4"
video_output = cv2.VideoWriter("_".join([prefix, basename]), video_codec, fps, (frame_width, frame_height))

ok, first_frame = cap.read()
if not ok:
    print("[ERROR] getting frame from video")
    sys.exit()
frame_gray_init = cv2.cvtColor(first_frame, cv2.COLOR_BGR2GRAY)

# create canvas to paint on
hsv_canvas = np.zeros_like(first_frame)
# set saturation value (position 2 in HSV space) to 255
hsv_canvas[..., 1] = 255

while True:
    # get next frame
    ok, frame = cap.read()
    if not ok:
        # end of file is the normal exit condition, not an error
        print("[INFO] reached end of file")
        break
    frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
    # compare previous frame with current frame
    flow = cv2.calcOpticalFlowFarneback(frame_gray_init, frame_gray, None, 0.5, 3, 15, 3, 5, 1.1, 0)
    # convert flow vectors to polar coordinates (magnitude + angle in radians)
    magnitude, angle = cv2.cartToPolar(flow[..., 0], flow[..., 1])
    # set hue of HSV canvas (position 1)
    # BUG FIX: OpenCV hue is 0-180, but `angle*(180/(np.pi/2))` maps the 0-2*pi
    # angle to 0-720 and overflows; angle in degrees halved keeps it in range.
    hsv_canvas[..., 0] = angle * 180 / np.pi / 2
    # set pixel intensity value (position 3) from the flow magnitude
    hsv_canvas[..., 2] = cv2.normalize(magnitude, None, 0, 255, cv2.NORM_MINMAX)

    frame_rgb = cv2.cvtColor(hsv_canvas, cv2.COLOR_HSV2BGR)

    # optional recording result/mask
    video_output.write(frame_rgb)

    cv2.imshow('Optical Flow (dense)', frame_rgb)
    if cv2.waitKey(1) & 0xFF == ord('q'):
        break

    # set initial frame to current frame
    frame_gray_init = frame_gray

cv2.destroyAllWindows()
# BUG FIX: release the writer as well, otherwise the recording may be truncated
video_output.release()
cap.release()
Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
# Usage
# python scripts/optical_flow_sparse.py -p 'resources/car_race_01.mp4'
#
# Track automatically detected (Shi-Tomasi) corner features across a video
# with sparse Lucas-Kanade optical flow and draw their motion trails.
import datetime
import sys
import numpy as np
import cv2
import argparse

# Parse the arguments
ap = argparse.ArgumentParser()
ap.add_argument("-p", "--path", help="Path to video file", default="resources/car_race_02.mp4")
args = vars(ap.parse_args())

cap = cv2.VideoCapture(args["path"])
if not cap.isOpened():
    print("[ERROR] cannot open video file")
    sys.exit()

# generate initial corners of detected object
# set limit, minimum distance in pixels and quality of object corner to be tracked
parameters_shitomasi = dict(maxCorners=100, qualityLevel=0.3, minDistance=7)
# set min size of tracked object, e.g. 15x15px
parameter_lucas_kanade = dict(winSize=(15, 15), maxLevel=2, criteria=(cv2.TERM_CRITERIA_EPS |
                              cv2.TERM_CRITERIA_COUNT, 10, 0.03))
# create random colours for visualization for all 100 max corners for RGB channels
colours = np.random.randint(0, 255, (100, 3))

# get first video frame
ok, frame = cap.read()
if not ok:
    print("[ERROR] cannot get frame from video")
    sys.exit()
# convert to grayscale
frame_gray_init = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

# Use Shi-Tomasi corner detection to pick features in the initial frame
edges = cv2.goodFeaturesToTrack(frame_gray_init, mask=None, **parameters_shitomasi)
# [Debug] show amount of found edges
# max value = maxCorners see above. Reduce qualityLevel to get more hits
# print(len(edges))

# create a black canvas the size of the initial frame
canvas = np.zeros_like(frame)

# Optional recording parameter
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = int(cap.get(cv2.CAP_PROP_FPS))
video_codec = cv2.VideoWriter_fourcc('m', 'p', '4', 'v')
prefix = 'recordings/'+datetime.datetime.now().strftime("%y%m%d_%H%M%S")
basename = "object_track.mp4"
video_output = cv2.VideoWriter("_".join([prefix, basename]), video_codec, fps, (frame_width, frame_height))

# loop through the remaining frames of the video
# and apply algorithm to track selected objects
while True:
    # get next frame
    ok, frame = cap.read()
    if not ok:
        print("[INFO] end of file reached")
        break
    # prepare grayscale image
    frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
    # update object corners by comparing with found edges in initial frame
    update_edges, status, errors = cv2.calcOpticalFlowPyrLK(frame_gray_init, frame_gray, edges, None,
                                                            **parameter_lucas_kanade)
    # only keep points the algorithm successfully tracked
    new_edges = update_edges[status == 1]
    # to calculate directional flow we need to compare with previous position
    old_edges = edges[status == 1]
    # BUG FIX: if every feature is lost, `edges` becomes empty and the next
    # calcOpticalFlowPyrLK call fails — stop tracking instead of crashing
    if len(new_edges) == 0:
        print("[WARNING] all tracked features lost")
        break

    for i, (new, old) in enumerate(zip(new_edges, old_edges)):
        a, b = new.ravel()
        c, d = old.ravel()

        # draw line between old and new corner point with random colour
        mask = cv2.line(canvas, (int(a), int(b)), (int(c), int(d)), colours[i].tolist(), 2)
        # draw circle around new position
        frame = cv2.circle(frame, (int(a), int(b)), 5, colours[i].tolist(), -1)

    result = cv2.add(frame, mask)
    # optional recording result/mask
    # video_output.write(result)
    cv2.imshow('Optical Flow (sparse)', result)
    if cv2.waitKey(1) & 0xFF == ord('q'):
        break
    # overwrite initial frame with current before restarting the loop
    frame_gray_init = frame_gray.copy()
    # update to new edges before restarting the loop
    edges = new_edges.reshape(-1, 1, 2)


cv2.destroyAllWindows()
# BUG FIX: release the (optional) writer alongside the capture device
video_output.release()
cap.release()
Lines changed: 86 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,86 @@
1+
# Usage
# python scripts/optical_flow_sparse_manual.py -u 'rtsp://admin:instar@192.168.2.19/livestream/13'
# Click on video to select point to track
#
# Track a single mouse-selected point in an RTSP stream with sparse
# Lucas-Kanade optical flow and draw its motion trail onto a canvas.
import sys
import numpy as np
import cv2
import argparse
from imutils.video import VideoStream

# Parse the arguments
ap = argparse.ArgumentParser()
ap.add_argument("-u", "--url", help="RTSP streaming URL", default="rtsp://admin:instar@192.168.2.19/livestream/12")
args = vars(ap.parse_args())

# get video stream from IP camera
print("[INFO] starting video stream")
vs = VideoStream(args["url"]).start()

# first frame from stream
frame = vs.read()

# convert to grayscale
frame_gray_init = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

# set min size of tracked object, e.g. 15x15px
parameter_lucas_kanade = dict(winSize=(15, 15), maxLevel=4, criteria=(cv2.TERM_CRITERIA_EPS |
                              cv2.TERM_CRITERIA_COUNT, 10, 0.03))


# define function to manually select object to track
def select_point(event, x, y, flags, params):
    """Mouse callback: store the clicked pixel as the point to track."""
    global point, selected_point, old_points
    # record coordinates of mouse click
    if event == cv2.EVENT_LBUTTONDOWN:
        point = (x, y)
        selected_point = True
        old_points = np.array([[x, y]], dtype=np.float32)


# associate select function with window Selector
cv2.namedWindow('Optical Flow')
cv2.setMouseCallback('Optical Flow', select_point)

# initialize variables updated by function
selected_point = False
point = ()
old_points = ([[]])

# create a black canvas the size of the initial frame
canvas = np.zeros_like(frame)

# loop through the remaining frames of the video
# and apply algorithm to track selected objects
while True:
    # get next frame
    frame = vs.read()
    # convert to grayscale
    frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

    if selected_point is True:
        cv2.circle(frame, point, 5, (0, 0, 255), 2)
        # update the tracked point by comparing previous and current frame
        new_points, status, errors = cv2.calcOpticalFlowPyrLK(frame_gray_init, frame_gray, old_points, None,
                                                              **parameter_lucas_kanade)

        # overwrite initial frame with current before restarting the loop
        frame_gray_init = frame_gray.copy()

        # BUG FIX: read the *previous* coordinates before overwriting
        # old_points — the original assigned old_points = new_points first,
        # so both pairs were identical and the trail line was never visible.
        j, k = old_points.ravel()
        # update to new point before restarting the loop
        old_points = new_points
        x, y = new_points.ravel()

        # draw line between old and new point position
        canvas = cv2.line(canvas, (int(x), int(y)), (int(j), int(k)), (0, 255, 0), 3)
        # draw circle around new position
        frame = cv2.circle(frame, (int(x), int(y)), 5, (0, 255, 0), -1)

    result = cv2.add(frame, canvas)
    cv2.imshow('Optical Flow', result)
    if cv2.waitKey(1) & 0xFF == ord('q'):
        break


cv2.destroyAllWindows()
# BUG FIX: stop the background stream thread before exiting
vs.stop()
sys.exit()

0 commit comments

Comments
 (0)