Docs cleanup and Google-style tracker docstrings (#6751)

Signed-off-by: Glenn Jocher <glenn.jocher@ultralytics.com> Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
2023-12-03 04:12:33 +01:00 · 2023-12-03 04:12:33 +01:00 · 80802be1e5
commit 80802be1e5
parent 60041014a8
44 changed files with 740 additions and 529 deletions
--- a/ultralytics/trackers/utils/gmc.py
+++ b/ultralytics/trackers/utils/gmc.py
@ -13,7 +13,7 @@ class GMC:
    Generalized Motion Compensation (GMC) class for tracking and object detection in video frames.

    This class provides methods for tracking and detecting objects based on several tracking algorithms including ORB,
-    SIFT, ECC, and Sparse Optical Flow. It also supports downscaling of  frames for computational efficiency.
+    SIFT, ECC, and Sparse Optical Flow. It also supports downscaling of frames for computational efficiency.

    Attributes:
        method (str): The method used for tracking. Options include 'orb', 'sift', 'ecc', 'sparseOptFlow', 'none'.
@ -33,8 +33,14 @@ class GMC:
        applySparseOptFlow(self, raw_frame, detections=None): Applies the Sparse Optical Flow method to a raw frame.
    """

-    def __init__(self, method='sparseOptFlow', downscale=2):
-        """Initialize a video tracker with specified parameters."""
+    def __init__(self, method: str = 'sparseOptFlow', downscale: int = 2) -> None:
+        """
+        Initialize a video tracker with specified parameters.
+
+        Args:
+            method (str): The method used for tracking. Options include 'orb', 'sift', 'ecc', 'sparseOptFlow', 'none'.
+            downscale (int): Downscale factor for processing frames.
+        """
        super().__init__()

        self.method = method
@ -72,11 +78,25 @@ class GMC:
        self.prevFrame = None
        self.prevKeyPoints = None
        self.prevDescriptors = None
-
        self.initializedFirstFrame = False

-    def apply(self, raw_frame, detections=None):
-        """Apply object detection on a raw frame using specified method."""
+    def apply(self, raw_frame: np.array, detections: list = None) -> np.array:
+        """
+        Apply object detection on a raw frame using specified method.
+
+        Args:
+            raw_frame (np.array): The raw frame to be processed.
+            detections (list): List of detections to be used in the processing.
+
+        Returns:
+            np.array: Processed frame.
+
+        Examples:
+            >>> gmc = GMC()
+            >>> gmc.apply(np.array([[1, 2, 3], [4, 5, 6]]))
+            array([[1, 2, 3],
+                   [4, 5, 6]])
+        """
        if self.method in ['orb', 'sift']:
            return self.applyFeatures(raw_frame, detections)
        elif self.method == 'ecc':
@ -86,13 +106,28 @@ class GMC:
        else:
            return np.eye(2, 3)

-    def applyEcc(self, raw_frame, detections=None):
-        """Initialize."""
+    def applyEcc(self, raw_frame: np.array, detections: list = None) -> np.array:
+        """
+        Apply ECC algorithm to a raw frame.
+
+        Args:
+            raw_frame (np.array): The raw frame to be processed.
+            detections (list): List of detections to be used in the processing.
+
+        Returns:
+            np.array: Processed frame.
+
+        Examples:
+            >>> gmc = GMC()
+            >>> gmc.applyEcc(np.array([[1, 2, 3], [4, 5, 6]]))
+            array([[1, 2, 3],
+                   [4, 5, 6]])
+        """
        height, width, _ = raw_frame.shape
        frame = cv2.cvtColor(raw_frame, cv2.COLOR_BGR2GRAY)
        H = np.eye(2, 3, dtype=np.float32)

-        # Downscale image (TODO: consider using pyramids)
+        # Downscale image
        if self.downscale > 1.0:
            frame = cv2.GaussianBlur(frame, (3, 3), 1.5)
            frame = cv2.resize(frame, (width // self.downscale, height // self.downscale))
@ -118,22 +153,35 @@ class GMC:

        return H

-    def applyFeatures(self, raw_frame, detections=None):
-        """Initialize."""
+    def applyFeatures(self, raw_frame: np.array, detections: list = None) -> np.array:
+        """
+        Apply feature-based methods like ORB or SIFT to a raw frame.
+
+        Args:
+            raw_frame (np.array): The raw frame to be processed.
+            detections (list): List of detections to be used in the processing.
+
+        Returns:
+            np.array: Processed frame.
+
+        Examples:
+            >>> gmc = GMC()
+            >>> gmc.applyFeatures(np.array([[1, 2, 3], [4, 5, 6]]))
+            array([[1, 2, 3],
+                   [4, 5, 6]])
+        """
        height, width, _ = raw_frame.shape
        frame = cv2.cvtColor(raw_frame, cv2.COLOR_BGR2GRAY)
        H = np.eye(2, 3)

-        # Downscale image (TODO: consider using pyramids)
+        # Downscale image
        if self.downscale > 1.0:
-            # frame = cv2.GaussianBlur(frame, (3, 3), 1.5)
            frame = cv2.resize(frame, (width // self.downscale, height // self.downscale))
            width = width // self.downscale
            height = height // self.downscale

        # Find the keypoints
        mask = np.zeros_like(frame)
-        # mask[int(0.05 * height): int(0.95 * height), int(0.05 * width): int(0.95 * width)] = 255
        mask[int(0.02 * height):int(0.98 * height), int(0.02 * width):int(0.98 * width)] = 255
        if detections is not None:
            for det in detections:
@ -157,10 +205,10 @@ class GMC:

            return H

-        # Match descriptors.
+        # Match descriptors
        knnMatches = self.matcher.knnMatch(self.prevDescriptors, descriptors, 2)

-        # Filtered matches based on smallest spatial distance
+        # Filter matches based on smallest spatial distance
        matches = []
        spatialDistances = []

@ -244,15 +292,29 @@ class GMC:

        return H

-    def applySparseOptFlow(self, raw_frame, detections=None):
-        """Initialize."""
+    def applySparseOptFlow(self, raw_frame: np.array, detections: list = None) -> np.array:
+        """
+        Apply Sparse Optical Flow method to a raw frame.
+
+        Args:
+            raw_frame (np.array): The raw frame to be processed.
+            detections (list): List of detections to be used in the processing.
+
+        Returns:
+            np.array: Processed frame.
+
+        Examples:
+            >>> gmc = GMC()
+            >>> gmc.applySparseOptFlow(np.array([[1, 2, 3], [4, 5, 6]]))
+            array([[1, 2, 3],
+                   [4, 5, 6]])
+        """
        height, width, _ = raw_frame.shape
        frame = cv2.cvtColor(raw_frame, cv2.COLOR_BGR2GRAY)
        H = np.eye(2, 3)

        # Downscale image
        if self.downscale > 1.0:
-            # frame = cv2.GaussianBlur(frame, (3, 3), 1.5)
            frame = cv2.resize(frame, (width // self.downscale, height // self.downscale))

        # Find the keypoints
@ -260,13 +322,9 @@ class GMC:

        # Handle first frame
        if not self.initializedFirstFrame:
-            # Initialize data
            self.prevFrame = frame.copy()
            self.prevKeyPoints = copy.copy(keypoints)
-
-            # Initialization done
            self.initializedFirstFrame = True
-
            return H

        # Find correspondences
@ -285,23 +343,21 @@ class GMC:
        currPoints = np.array(currPoints)

        # Find rigid matrix
-        if (np.size(prevPoints, 0) > 4) and (np.size(prevPoints, 0) == np.size(prevPoints, 0)):
+        if np.size(prevPoints, 0) > 4 and np.size(prevPoints, 0) == np.size(prevPoints, 0):
            H, inliers = cv2.estimateAffinePartial2D(prevPoints, currPoints, cv2.RANSAC)

-            # Handle downscale
            if self.downscale > 1.0:
                H[0, 2] *= self.downscale
                H[1, 2] *= self.downscale
        else:
            LOGGER.warning('WARNING: not enough matching points')

-        # Store to next iteration
        self.prevFrame = frame.copy()
        self.prevKeyPoints = copy.copy(keypoints)

        return H

-    def reset_params(self):
+    def reset_params(self) -> None:
        """Reset parameters."""
        self.prevFrame = None
        self.prevKeyPoints = None