
Commit c774ee0

modify deepsort
1 parent 97fc377 commit c774ee0

7 files changed: +136 -95 lines changed

run_yolov7.txt

Lines changed: 2 additions & 1 deletion

@@ -60,4 +60,5 @@ CUDA_VISIBLE_DEVICES=0 python train_aux.py --dataset mot17 --workers 8 --device
 
 track:
 python tracker/track.py --dataset mot17 --data_format yolo --tracker sort --model_path runs/train/yolov7-w6-custom3/weights/best.pt --save_images
-python tracker/track.py --dataset mot17 --data_format yolo --tracker bytetrack --model_path weights/best.pt --save_images
+python tracker/track.py --dataset mot17 --data_format yolo --tracker bytetrack --model_path weights/best.pt --save_images
+python tracker/track.py --dataset mot17 --data_format yolo --tracker deepsort --model_path weights/best.pt --save_images
3 binary files changed (169 Bytes, 1.36 KB, -245 Bytes): binary files not shown.

tracker/basetrack.py

Lines changed: 10 additions & 1 deletion

@@ -73,7 +73,7 @@ def mark_removed(self):
 """
 class STrack(BaseTrack):
     def __init__(self, cls, tlwh, score, kalman_format='default',
-        feature=None, use_avg_of_feature=True) -> None:
+        feature=None, use_avg_of_feature=True, store_features_budget=100) -> None:
         """
         cls: category of this obj
         tlwh: positoin score: conf score
@@ -95,6 +95,7 @@ def __init__(self, cls, tlwh, score, kalman_format='default',
         self.time_since_update = None
 
         self.features = []
+        self.store_features_budget = store_features_budget
         self.has_feature = True if feature is not None else False
         self.use_avg_of_feature = use_avg_of_feature
         if feature is not None:
@@ -230,6 +231,8 @@ def activate(self, frame_id):
         self.frame_id = frame_id
         self.start_frame = frame_id
 
+        self.time_since_update = 0
+
     def predict(self):
         """
         kalman predict step
@@ -254,6 +257,8 @@ def multi_predict(stracks, kalman):
             stracks[i].mean = mean
             stracks[i].cov = cov
 
+        for strack in stracks: strack.time_since_update += 1
+
     def re_activate(self, new_track, frame_id, new_id=False):
         """
         reactivate a lost track
@@ -275,6 +280,8 @@ def re_activate(self, new_track, frame_id, new_id=False):
             self.track_id = self.next_id()
         self.score = new_track.score
 
+        self.time_since_update = 0
+
     def update(self, new_track, frame_id):
         """
         update a track
@@ -311,12 +318,14 @@ def update(self, new_track, frame_id):
                 self.features = [smooth_feat] # as new feature
             else:
                 self.features.append(feature)
+                self.features = self.features[-self.store_features_budget: ]
 
 
         # update status
         self.state = TrackState.Tracked
        self.is_activated = True
 
+        self.time_since_update = 0
 
 
     """

tracker/deepsort.py

Lines changed: 44 additions & 16 deletions

@@ -1,7 +1,7 @@
 
 import numpy as np
 from basetrack import TrackState, STrack, BaseTracker
-from kalman_filter import KalmanFilter, NaiveKalmanFilter
+from kalman_filter import KalmanFilter, NaiveKalmanFilter, chi2inv95
 from reid_models.deepsort_reid import Extractor
 import matching
 import torch
@@ -39,6 +39,43 @@ def get_feature(self, tlbrs, ori_img):
             features = np.array([])
         return features
 
+    def gate_cost_matrix(self, cost_matrix, tracks, dets, max_apperance_thresh=0.15, gated_cost=1e5, only_position=False):
+        """
+        gate the cost matrix by the Kalman state distance, constrained by the
+        0.95 confidence interval of the chi-square distribution
+
+        cost_matrix: np.ndarray, shape (len(tracks), len(dets))
+        tracks: List[STrack]
+        dets: List[STrack]
+        gated_cost: a very large constant assigned to infeasible associations
+        only_position: use [xc, yc, a, h] as the state vector or only [xc, yc]
+
+        return:
+        updated cost_matrix, np.ndarray
+        """
+        gating_dim = 2 if only_position else 4
+        gating_threshold = chi2inv95[gating_dim]
+        measurements = np.asarray([STrack.tlwh2xyah(det.tlwh) for det in dets])  # (len(dets), 4)
+
+        cost_matrix[cost_matrix > max_apperance_thresh] = gated_cost
+        for row, track in enumerate(tracks):
+            gating_distance = self.kalman.gating_distance(
+                track.mean, track.cov, measurements, only_position
+            )
+            cost_matrix[row, gating_distance > gating_threshold] = gated_cost
+        return cost_matrix
+
+    def gated_metric(self, tracks, dets):
+        """
+        get the cost matrix: first calculate the appearance cost, then gate it by the Kalman state.
+
+        tracks: List[STrack]
+        dets: List[STrack]
+        """
+        Apperance_dist = matching.nearest_embedding_distance(tracks=tracks, detections=dets, metric='cosine')
+        cost_matrix = self.gate_cost_matrix(Apperance_dist, tracks, dets, )
+        return cost_matrix
+
     def update(self, det_results, ori_img):
         """
         this func is called by every time step
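The gate relies on the squared Mahalanobis distance between a track's predicted state and each detection, cut off at the 0.95 quantile of a chi-square distribution with 4 degrees of freedom (the chi2inv95[4] constant). A rough, self-contained sketch of that computation, with illustrative helper names and scipy used only to reproduce the constant:

import numpy as np
from scipy.stats import chi2

# 95% gate for a 4-dimensional measurement [xc, yc, a, h]; numerically about 9.4877
GATE_95 = chi2.ppf(0.95, df=4)

def squared_mahalanobis(mean, cov, measurements):
    """mean: (4,), cov: (4, 4) predicted measurement distribution of one track;
    measurements: (N, 4) detections in the same parametrization."""
    d = measurements - mean              # (N, 4) innovations
    L = np.linalg.cholesky(cov)          # cov = L @ L.T
    z = np.linalg.solve(L, d.T)          # solve L z = d^T
    return np.sum(z * z, axis=0)         # (N,) squared Mahalanobis distances

def gate_row(appearance_cost_row, maha_row, appearance_thresh=0.15, gated_cost=1e5):
    """Disallow pairs that are too far in appearance space or outside the chi-square gate."""
    row = appearance_cost_row.copy()
    row[row > appearance_thresh] = gated_cost
    row[maha_row > GATE_95] = gated_cost
    return row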
@@ -85,7 +122,7 @@ def update(self, det_results, ori_img):
             features = self.get_feature(bbox_temp, ori_img)
 
             # detections: List[Strack]
-            detections = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format, feature=feature)
+            detections = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format, feature=feature, use_avg_of_feature=False)
                           for (cls, xywh, score, feature) in zip(det_results[:, -1], det_results[:, :4], det_results[:, 4], features)]
 
         else:
@@ -106,15 +143,9 @@ def update(self, det_results, ori_img):
         # Kalman predict, update every mean and cov of tracks
         STrack.multi_predict(stracks=strack_pool, kalman=self.kalman)
 
-        # calculate apperance distance, shape:(len(strack_pool), len(detections))
-        Apperance_dist = matching.embedding_distance(tracks=strack_pool, detections=detections, metric='euclidean')
-        # calculate iou distance, shape:(len(strack_pool), len(detections))
-        IoU_dist = matching.iou_distance(atracks=strack_pool, btracks=detections)
-        # fuse
-        Dist_mat = self.gamma * IoU_dist + (1. - self.gamma) * Apperance_dist
-
         # match thresh=0.9 is same in ByteTrack code
-        matched_pair0, u_tracks0_idx, u_dets0_idx = matching.linear_assignment(Dist_mat, thresh=0.7)
+        matched_pair0, u_tracks0_idx, u_dets0_idx = matching.matching_cascade(self.gated_metric, 0.9, self.max_time_lost,
+                                                                              strack_pool, detections)
 
         for itrack_match, idet_match in matched_pair0:
             track = strack_pool[itrack_match]
@@ -148,7 +179,6 @@ def update(self, det_results, ori_img):
                 activated_starcks.append(track)
 
             elif track.state == TrackState.Lost:
-                exit(0)
                 track.re_activate(det, self.frame_id, )
                 refind_stracks.append(track)
 
@@ -160,10 +190,8 @@
             lost_stracks.append(track)
 
         # deal with unconfirmed tracks, match new track of last frame and new high conf det
-        Apperance_dist = matching.embedding_distance(tracks=unconfirmed, detections=u_det1, metric='euclidean')
-        IoU_dist = matching.iou_distance(atracks=unconfirmed, btracks=u_det1)
-        Dist_mat = self.gamma * IoU_dist + (1. - self.gamma) * Apperance_dist
-        matched_pair2, u_tracks2_idx, u_det2_idx = matching.linear_assignment(Dist_mat, thresh=0.7)
+        matched_pair2, u_tracks2_idx, u_det2_idx = matching.matching_cascade(self.gated_metric, 0.7, self.max_time_lost,
+                                                                             unconfirmed, u_det1)
 
         for itrack_match, idet_match in matched_pair2:
             track = unconfirmed[itrack_match]
@@ -179,7 +207,7 @@
         # deal with new tracks
         for idx in u_det2_idx:
             det = u_det1[idx]
-            if det.score > self.det_thresh + 0.1:
+            if det.score > self.det_thresh:
                 det.activate(self.frame_id)
                 activated_starcks.append(det)
 
tracker/matching.py

Lines changed: 80 additions & 77 deletions

@@ -102,6 +102,29 @@ def embedding_distance(tracks, detections, metric='cosine'):
         raise NotImplementedError
     return cost_matrix
 
+def nearest_embedding_distance(tracks, detections, metric='cosine'):
+    """
+    different from embedding_distance, this func calculates the
+    nearest distance among all track history features and the detections
+
+    tracks: list[STrack]
+    detections: list[STrack]
+    metric: str, cosine or euclidean
+
+    return:
+    cost_matrix, np.ndarray, shape (len(tracks), len(detections))
+    """
+    cost_matrix = np.zeros((len(tracks), len(detections)))
+    det_features = np.asarray([det.features[-1] for det in detections])
+
+    for row, track in enumerate(tracks):
+        track_history_features = np.asarray(track.features)
+        dist = 1. - cal_cosine_distance(track_history_features, det_features)
+        dist = dist.min(axis=0)
+        cost_matrix[row, :] = dist
+
+    return cost_matrix
+
 def ecu_iou_distance(tracks, detections, img0_shape):
     """
     combine eculidian center-point distance and iou distance
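The new metric compares each detection against a track's whole feature gallery and keeps the smallest cosine distance, rather than using only the latest feature. A self-contained NumPy sketch of the same idea (hypothetical function name; explicit normalization stands in for the repo's cal_cosine_distance helper):

import numpy as np

def nearest_cosine_cost(track_galleries, det_features):
    """track_galleries: list of (n_i, d) arrays holding a track's stored features;
    det_features: (m, d) array, one embedding per detection.
    Returns a (len(track_galleries), m) cost matrix of the smallest cosine
    distance between each detection and any feature in the track's gallery."""
    det = det_features / np.linalg.norm(det_features, axis=1, keepdims=True)
    cost = np.zeros((len(track_galleries), det.shape[0]))
    for row, gallery in enumerate(track_galleries):
        g = gallery / np.linalg.norm(gallery, axis=1, keepdims=True)
        cos_sim = g @ det.T                      # (n_i, m) cosine similarities
        cost[row] = (1.0 - cos_sim).min(axis=0)  # keep the closest gallery feature
    return cost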
@@ -189,90 +212,70 @@ def fuse_motion(kf, cost_matrix, tracks, detections, only_position=False, lambda
     return cost_matrix
 
 
-"""
-distance metric that combines multi-frame info
-used in StrongSORT
-TODO: use in DeepSORT
-"""
-
-class NearestNeighborDistanceMetric(object):
+def matching_cascade(
+        distance_metric, matching_thresh, cascade_depth, tracks, detections,
+        track_indices=None, detection_indices=None):
     """
-    A nearest neighbor distance metric that, for each target, returns
-    the closest distance to any sample that has been observed so far.
-
-    Parameters
-    ----------
-    metric : str
-        Either "euclidean" or "cosine".
-    matching_threshold: float
-        The matching threshold. Samples with larger distance are considered an
-        invalid match.
-    budget : Optional[int]
-        If not None, fix samples per class to at most this number. Removes
-        the oldest samples when the budget is reached.
-
-    Attributes
-    ----------
-    samples : Dict[int -> List[ndarray]]
-        A dictionary that maps from target identities to the list of samples
-        that have been observed so far.
-
+    Run the matching cascade of DeepSORT
+
+    distance_metric: function that calculates the cost matrix
+    matching_thresh: float, associations with cost larger than this value are disregarded.
+    cascade_depth: int, equal to max_age of a tracklet
+    tracks: List[STrack], current tracks
+    detections: List[STrack], current detections
+    track_indices: List[int], tracks that will be calculated, Default None
+    detection_indices: List[int], detections that will be calculated, Default None
+
+    return:
+    matched pairs, unmatched tracks, unmatched detections: List[int], List[int], List[int]
     """
+    if track_indices is None:
+        track_indices = list(range(len(tracks)))
+    if detection_indices is None:
+        detection_indices = list(range(len(detections)))
 
-    def __init__(self, metric, matching_threshold, budget=None):
-        if metric == "euclidean":
-            self._metric = cal_eculidian_distance
-        elif metric == "cosine":
-            self._metric = cal_cosine_distance
-        else:
-            raise ValueError(
-                "Invalid metric; must be either 'euclidean' or 'cosine'")
-        self.matching_threshold = matching_threshold
-        self.budget = budget
-        self.samples = {}
-
-    def partial_fit(self, features, targets, active_targets):
-        """Update the distance metric with new data.
-
-        Parameters
-        ----------
-        features : ndarray
-            An NxM matrix of N features of dimensionality M.
-        targets : ndarray
-            An integer array of associated target identities.
-        active_targets : List[int]
-            A list of targets that are currently present in the scene.
+    detections_to_match = detection_indices
+    matches = []
 
+    for level in range(cascade_depth):
         """
-        for feature, target in zip(features, targets):
-            self.samples.setdefault(target, []).append(feature)
-            if self.budget is not None:
-                self.samples[target] = self.samples[target][-self.budget:]
-        self.samples = {k: self.samples[k] for k in active_targets}
-
-    def distance(self, features, targets):
-        """Compute distance between features and targets.
-
-        Parameters
-        ----------
-        features : ndarray
-            An NxM matrix of N features of dimensionality M.
-        targets : List[int]
-            A list of targets to match the given `features` against.
-
-        Returns
-        -------
-        ndarray
-            Returns a cost matrix of shape len(targets), len(features), where
-            element (i, j) contains the closest squared distance between
-            `targets[i]` and `features[j]`.
-
+        match newer tracks with detections first
         """
-        cost_matrix = np.zeros((len(targets), len(features)))
-        for i, target in enumerate(targets):
-            cost_matrix[i, :] = self._metric(self.samples[target], features)
-        return cost_matrix
+        if not len(detections_to_match):  # No detections left
+            break
+
+        track_indices_l = [
+            k for k in track_indices
+            if tracks[k].time_since_update == 1 + level
+        ]  # filter tracks whose age equals level + 1 (the age of the newest track is 1)
+
+        if not len(track_indices_l):  # Nothing to match at this level
+            continue
+
+        # tracks and detections which will be matched in the current level
+        track_l = [tracks[idx] for idx in track_indices_l]  # List[STrack]
+        det_l = [detections[idx] for idx in detections_to_match]  # List[STrack]
+
+        # calculate the cost matrix
+        cost_matrix = distance_metric(track_l, det_l)
+
+        # solve the linear assignment problem
+        matched_row_col, umatched_row, umatched_col = \
+            linear_assignment(cost_matrix, matching_thresh)
+
+        for row, col in matched_row_col:  # for those who matched
+            matches.append((track_indices_l[row], detections_to_match[col]))
+
+        umatched_detecion_l = []  # current detections not matched
+        for col in umatched_col:  # for detections not matched
+            umatched_detecion_l.append(detections_to_match[col])
+
+        detections_to_match = umatched_detecion_l  # update detections to match for next level
+    unmatched_tracks = list(set(track_indices) - set(k for k, _ in matches))
+
+    return matches, unmatched_tracks, detections_to_match
 
+
 
 """
 funcs to cal similarity, copied from UAVMOT
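To see what the cascade ordering buys, here is a toy, self-contained example (made-up time_since_update values; the per-level linear assignment step is omitted). Recently updated tracks get first pick of the detections, and only the leftovers flow down to older tracks:

# track index -> time_since_update (hypothetical values)
tracks_age = {0: 1, 1: 3, 2: 1, 3: 2}
cascade_depth = 3

for level in range(cascade_depth):
    level_tracks = [t for t, age in tracks_age.items() if age == 1 + level]
    print(f"level {level}: tracks {level_tracks} are matched before older ones")
# level 0: tracks [0, 2] are matched before older ones
# level 1: tracks [3] are matched before older ones
# level 2: tracks [1] are matched before older ones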
