如何在图像中跟踪我们想要的任何特定对象?

How to Track any specific object that we want in an image?

我想在视频帧中跟踪我想要的任何对象,而不需要任何对象检测算法,如 haar-cascade、faster-RCNN、SSD 或 YOLO。 我怎样才能做到这一点?请推荐我任何方法。

我使用了 OpenCV 跟踪 API 正如 Adrian 在这里指出的 https://www.pyimagesearch.com/2018/08/06/tracking-multiple-objects-with-opencv/

但是,我想制作更复杂的跟踪器。 开发人员可以向我推荐任何算法或其他 API 吗?

你提到的算法可能是最好的选择。 顺便说一句,如果你有一些你想找的对象的图像,你可以尝试使用

SIFT points (a.k.a. SURF points in Matlab)

然后给自己写一个检测器。

您可能会发现比例因子和可能的计算时间存在一些问题,但我认为您可以尝试使用此技术。

import numpy as np
import cv2
import copy

class selectROI():

    def __init__(self):
        self.refPt = []
        self.clickEventsEnabled = False
        self.drawingRectangle = False
        self.rectangleDrawn = False
        self.x_start = -1
        self.y_start = -1
        self.ref_frame = None

    def clickPolygonPoints(self, event, x, y, flags, param):

        temp_frame = self.ref_frame.copy()

        if(self.clickEventsEnabled == True):
                if event == cv2.EVENT_LBUTTONDOWN:
                        if((self.rectangleDrawn == False)):
                            self.drawingRectangle = True
                            self.x_start,self.y_start = x,y
                            self.refPt.append((x,y))

                elif event ==  cv2.EVENT_MOUSEMOVE: 
                        if(self.drawingRectangle == True):
                            cv2.rectangle(temp_frame, (self.x_start,self.y_start), (x,y), (0,0,255), 2)
                            cv2.imshow("ref_frame", temp_frame)
                            temp_frame = self.ref_frame

                elif event == cv2.EVENT_LBUTTONUP:
                        if((self.rectangleDrawn == False)):
                            self.drawingRectangle = False
                            self.rectangleDrawn = True
                            cv2.rectangle(self.ref_frame, (self.x_start, self.y_start), (x,y), (0,0,255), 2)
                            self.refPt.append((self.x_start, self.y_start))
                            self.refPt.append((x, self.y_start))
                            self.refPt.append((x, y))
                            self.refPt.append((self.x_start, y))

                            roiPoints = [(self.x_start, self.y_start), (x, y)]

                            if len(roiPoints) == 2: #when two points were found
                                    roi = self.ref_frame[roiPoints[0][1]:roiPoints[1][1], roiPoints[0][0]:roiPoints[1][0]]
                                    cv2.imshow("Cropped", roi)


    def maskImg_WithROI(self, frame, ROIPointsList):
            pointsArray = np.array(ROIPointsList)
            mask = np.zeros(frame.shape, dtype=np.uint8)
            white = (255,255,255)
            cv2.fillPoly(mask, np.int32([pointsArray]), white)
            maskedImage = cv2.bitwise_and(frame, mask)
            return maskedImage  

    def outputROIMask(self, frame, ROIPointsList):
            pointsArray = np.array(ROIPointsList)
            pointsArray = pointsArray.reshape((-1,1,2))
            mask = np.zeros(frame.shape, dtype=np.uint8)
            white = (255,255,255)
            cv2.fillPoly(mask, np.int32([pointsArray]), white)
            return mask  

    def main(self):

            self.clickEventsEnabled = True

            self.ref_frame = cv2.imread('picture.png')
            originalRef_Frame = self.ref_frame.copy()

            cv2.namedWindow("ref_frame")
            cv2.setMouseCallback("ref_frame", self.clickPolygonPoints)

            while True:

                    cv2.imshow("ref_frame", self.ref_frame)

                    key = cv2.waitKey(0) & 0xFF

                    if key == ord("r"):
                         self.ref_frame = originalRef_Frame.copy()
                         self.refPt = []
                         self.drawingRectangle = False
                         self.rectangleDrawn = False
                         self.x_start, self.y_start = -1,-1

                    elif key == ord("p"):
                         self.clickEventsEnabled = False
                         self.ref_frame = originalRef_Frame.copy()
                         self.drawingRectangle = False
                         self.rectangleDrawn = False
                         break

                    elif key == ord("q"):
                            break

            self.ref_frame = self.maskImg_WithROI(self.ref_frame, self.refPt)
            cv2.imshow("ref_frame", self.ref_frame)

            roiMask = self.outputROIMask(self.ref_frame, self.refPt)
            cv2.imwrite("ROI.jpg", roiMask)

            cv2.waitKey(0)
            cv2.destroyAllWindows()

if __name__ == '__main__':
    selROI = selectROI()
    selROI.main()`