xuan2261
diff --git a/‎.gitignore
Lines changed: 7 additions & 0 deletions b/‎.gitignore
Lines changed: 7 additions & 0 deletions
diff --git a/‎README.md
Lines changed: 4 additions & 2 deletions b/‎README.md
Lines changed: 4 additions & 2 deletions
diff --git a/‎data/uavdt.yaml
Lines changed: 7 additions & 0 deletions b/‎data/uavdt.yaml
Lines changed: 7 additions & 0 deletions
diff --git a/‎run_yolov7.txt
Lines changed: 3 additions & 1 deletion b/‎run_yolov7.txt
Lines changed: 3 additions & 1 deletion
diff --git a/‎tools/convert_UAVDT_to_yolo.py
Lines changed: 2 additions & 2 deletions b/‎tools/convert_UAVDT_to_yolo.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎tracker/basetrack.py
Lines changed: 13 additions & 16 deletions b/‎tracker/basetrack.py
Lines changed: 13 additions & 16 deletions
diff --git a/‎tracker/botsort.py
Lines changed: 7 additions & 22 deletions b/‎tracker/botsort.py
Lines changed: 7 additions & 22 deletions
diff --git a/‎tracker/bytetrack.py
Lines changed: 7 additions & 21 deletions b/‎tracker/bytetrack.py
Lines changed: 7 additions & 21 deletions
diff --git a/‎tracker/c_biou_tracker.py
Lines changed: 14 additions & 17 deletions b/‎tracker/c_biou_tracker.py
Lines changed: 14 additions & 17 deletions
diff --git a/‎tracker/deepmot.py
Lines changed: 5 additions & 18 deletions b/‎tracker/deepmot.py
Lines changed: 5 additions & 18 deletions
@@ -3,6 +3,13 @@ weights/*
 !weights/ckpt.t7
 !weights/DHN.pth 
 !weights/osnet_x0_25.pth
+visdrone/*
+uavdt/*
+mot17/*
+runs/*
+wandb/*
+track_result.txt
+.idea/
 
 # Byte-compiled / optimized / DLL files
 __pycache__/
 
@@ -2,6 +2,8 @@
 
 ## 0. 更新记录
 
+**2023.5.6[大更新]**: 对于v5, v7, 改变前处理和后处理方式(采用原有方式), ***解决了部分边界框近大远小的bug, 边界框更加精确***. 此外, 对于v8, 弃用了resize步骤, 直接推理.
+
 **2023.3.14**解决了`DeepSORT`和`C_BIoUTracker`后面出现的目标不跟踪的bug.  
 
 **2023.2.28**优化了`track_demo.py`, 减少了内存占用.  
@@ -34,7 +36,7 @@ YOLO v8 代码的参数与之前完全相同. 安装YOLO v8以及训练步骤请
 
 **2022.10.15**增加了对yolo v5的支持, 只需替换track.py, 将tracker文件夹放到v5的根目录(我测试的是官方的[repo](https://github.com/ultralytics/yolov5))下即可. 代码在[yolo v5](https://github.com/JackWoo0831/Yolov7-tracker/blob/master/tracker/track_yolov5.py). 
 
-**2022.09.27**修复了STrack类中update不更新外观的问题, 代码有较大更改, **您可能需要重新下载```./tracker```文件夹**. 
+**2022.09.27[大更新]**修复了STrack类中update不更新外观的问题, 代码有较大更改, **您可能需要重新下载```./tracker```文件夹**. 
 尝试加入StrongSORT, 但是目前还不work:(, 尽力调一调
 
 ## 1. 亮点  
@@ -144,7 +146,7 @@ origin意味着您直接使用数据集原本的路径, **而不是通过yolo要
 DATA_ROOT的值应为/data/datasets/VisDrone2019/VisDrone2019-MOT-test-dev/sequences, 即DATA_ROOT目录下应该为各个视频序列的文件夹.
 ```
 
-***2. yolo***
+***2. yolo[推荐]***
 
 yolo格式意味着您通过yolo训练时所要求的txt文件读取序列. 我们知道yolo要求txt文件记录图片的路径, 例如:
 
 
@@ -0,0 +1,7 @@
+train: ./uavdt/train.txt
+val: ./uavdt/test.txt
+test: ./uavdt/test.txt
+
+nc: 1
+
+names: ['car']
@@ -17,6 +17,8 @@ python train_aux.py --dataset visdrone --workers 8 --device 4 --batch-size 16 --
 ## all category
 python train_aux.py --dataset visdrone --workers 8 --device 0 --batch-size 16 --data data/visdrone_all.yaml --img 1280 1280 --cfg cfg/training/yolov7-w6.yaml --weights './weights/yolov7-w6_training.pt' --name yolov7-w6-custom --hyp data/hyp.scratch.custom.yaml
 
+uavdt:
+python train_aux.py --dataset uavdt --workers 8 --device 5 --batch-size 16 --data data/uavdt.yaml --img 1280 1280 --cfg cfg/training/yolov7-w6.yaml --weights './weights/yolov7-w6_training.pt' --name yolov7-w6-custom --hyp data/hyp.scratch.custom.yaml
 
 ## all category, no mosaic, rect training
 NOTE: edited augment = False in line 246, train_aux.py
@@ -61,4 +63,4 @@ CUDA_VISIBLE_DEVICES=0 python train_aux.py --dataset mot17 --workers 8 --device
 track:
 python tracker/track.py --dataset mot17 --data_format yolo --tracker sort --model_path runs/train/yolov7-w6-custom3/weights/best.pt --save_images
 python tracker/track.py --dataset mot17 --data_format yolo --tracker bytetrack --model_path weights/best.pt --save_images
-python tracker/track.py --dataset mot17 --data_format yolo --tracker deepsort --model_path weights/best.pt --save_images
+python tracker/track.py --dataset mot17 --data_format yolo --tracker deepsort --model_path weights/best.pt --save_images
@@ -47,7 +47,7 @@ def generate_imgs_and_labels(opts):
 
     # 分别处理train与test
     process_train_test(train_seq_list, frame_range, CATEGOTY_ID, 'train')
-    process_train_test(test_seq_list, frame_range, CATEGOTY_ID, 'test')
+    process_train_test(test_seq_list, {'start': 0.0, 'end': 1.0}, CATEGOTY_ID, 'test')
     print('All Done!!')
 
 
@@ -156,4 +156,4 @@ def process_train_test(seqs: list, frame_range: dict, cat_id: int = 0, split: st
     opts = parser.parse_args()
 
     generate_imgs_and_labels(opts)
-    # python uav_tools/convert_UAVDT_to_yolo.py --generate_imgs --half --random
+    # python tools/convert_UAVDT_to_yolo.py --generate_imgs --half --random
@@ -107,6 +107,17 @@ def __init__(self, cls, tlwh, score, kalman_format='default',
         self.mean, self.cov = None, None  # for kalman predict
 
     # some tool funcs 
+    @staticmethod
+    def tlbr2tlwh(tlbr):
+        """
+        Convert [x1, y1, x2, y2] box(es), shape (4,) or (..., 4), to [x1, y1, w, h]; returns a new array, input untouched.
+        """
+        result = np.asarray(tlbr).copy()
+        result[..., 2] -= result[..., 0]  # last-axis indexing handles a single box or a batch
+        result[..., 3] -= result[..., 1]
+
+        return result
+
     @staticmethod
     def tlwh2xyah(tlwh):
         """
@@ -375,26 +386,12 @@ def update(self, det_results, ori_img):
         """step 1. filter results and init tracks"""
         det_results = det_results[det_results[:, 4] > self.det_thresh]
 
-        # convert the scale to origin size
-        # NOTE: yolo v7 origin out format: [xc, yc, w, h, conf, cls0_conf, cls1_conf, ..., clsn_conf]
-        # TODO: check here, if nesscessary use two ratio
-        img_h, img_w = ori_img.shape[0], ori_img.shape[1]
-        ratio = [img_h / self.model_img_size[0], img_w / self.model_img_size[1]]  # usually > 1
-        det_results[:, 0], det_results[:, 2] =  det_results[:, 0]*ratio[1], det_results[:, 2]*ratio[1]
-        det_results[:, 1], det_results[:, 3] =  det_results[:, 1]*ratio[0], det_results[:, 3]*ratio[0]
-
 
         if det_results.shape[0] > 0:
-            if self.NMS:
-                # TODO: Note nms need tlbr format
-                bbox_temp = STrack.xywh2tlbr(det_results[:, :4])
-                nms_indices = nms(torch.from_numpy(bbox_temp), torch.from_numpy(det_results[:, 4]), 
-                                self.opts.nms_thresh)
-                det_results = det_results[nms_indices.numpy()]
 
             # detections: List[Strack]
-            detections = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_results[:, -1], det_results[:, :4], det_results[:, 4])]
+            detections = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_results[:, -1], det_results[:, :4], det_results[:, 4])]
 
         else:
             detections = []
 
@@ -328,28 +328,13 @@ def update(self, det_results, ori_img):
         lost_stracks = []           # The tracks which are not obtained in the current frame but are not removed.(Lost for some time lesser than the threshold for removing)
         removed_stracks = []
 
-        # convert the scale to origin size
-        # NOTE: yolo v7 origin out format: [xc, yc, w, h, conf, cls0_conf, cls1_conf, ..., clsn_conf]
-        # TODO: check here, if nesscessary use two ratio
-        img_h, img_w = ori_img.shape[0], ori_img.shape[1]
-        ratio = [img_h / self.model_img_size[0], img_w / self.model_img_size[1]]  # usually > 1
-        det_results[:, 0], det_results[:, 2] =  det_results[:, 0]*ratio[1], det_results[:, 2]*ratio[1]
-        det_results[:, 1], det_results[:, 3] =  det_results[:, 1]*ratio[0], det_results[:, 3]*ratio[0]
-
         """step 1. filter results and init tracks"""
 
         # filter small area bboxs
         if self.filter_small_area:  
             small_indicies = det_results[:, 2]*det_results[:, 3] > 50
             det_results = det_results[small_indicies]
 
-        # run NMS
-        if self.NMS:
-            # NOTE: Note nms need tlbr format
-            nms_indices = nms(torch.from_numpy(STrack.xywh2tlbr(det_results[:, :4])), torch.from_numpy(det_results[:, 4]), 
-                            self.opts.nms_thresh)
-            det_results = det_results[nms_indices.numpy()]
-
         # cal high and low indicies
         det_high_indicies = det_results[:, 4] >= self.det_thresh
         det_low_indicies = np.logical_and(np.logical_not(det_high_indicies), det_results[:, 4] > self.low_conf_thresh)
@@ -358,19 +343,19 @@ def update(self, det_results, ori_img):
         det_high, det_low = det_results[det_high_indicies], det_results[det_low_indicies]
         if det_high.shape[0] > 0:
             if self.use_apperance_model:
-                features = self.get_feature(STrack.xywh2tlbr(det_high[:, :4]), ori_img)
+                features = self.get_feature(det_high[:, :4], ori_img)
                 # detections: List[Strack]
-                D_high = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format, feature=feature)
-                                for (cls, xywh, score, feature) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4], features)]
+                D_high = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format, feature=feature)
+                                for (cls, tlbr, score, feature) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4], features)]
             else:
-                D_high = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
+                D_high = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
         else:
             D_high = []
 
         if det_low.shape[0] > 0:
-            D_low = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]
+            D_low = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]  # build from the low-score split, not det_high
         else:
             D_low = []
 
 
@@ -57,27 +57,13 @@ def update(self, det_results, ori_img):
         lost_stracks = []           # The tracks which are not obtained in the current frame but are not removed.(Lost for some time lesser than the threshold for removing)
         removed_stracks = []
 
-        # convert the scale to origin size
-        # NOTE: yolo v7 origin out format: [xc, yc, w, h, conf, cls0_conf, cls1_conf, ..., clsn_conf]
-        # TODO: check here, if nesscessary use two ratio
-        img_h, img_w = ori_img.shape[0], ori_img.shape[1]
-        ratio = [img_h / self.model_img_size[0], img_w / self.model_img_size[1]]  # usually > 1
-        det_results[:, 0], det_results[:, 2] =  det_results[:, 0]*ratio[1], det_results[:, 2]*ratio[1]
-        det_results[:, 1], det_results[:, 3] =  det_results[:, 1]*ratio[0], det_results[:, 3]*ratio[0]
-
         """step 1. filter results and init tracks"""
 
         # filter small area bboxs
         if self.filter_small_area:  
             small_indicies = det_results[:, 2]*det_results[:, 3] > 50
             det_results = det_results[small_indicies]
 
-        # run NMS
-        if self.NMS:
-            # NOTE: Note nms need tlbr format
-            nms_indices = nms(torch.from_numpy(STrack.xywh2tlbr(det_results[:, :4])), torch.from_numpy(det_results[:, 4]), 
-                            self.opts.nms_thresh)
-            det_results = det_results[nms_indices.numpy()]
 
         # cal high and low indicies
         det_high_indicies = det_results[:, 4] >= self.det_thresh
@@ -88,19 +74,19 @@ def update(self, det_results, ori_img):
         det_high, det_low = det_results[det_high_indicies], det_results[det_low_indicies]
         if det_high.shape[0] > 0:
             if self.use_apperance_model:
-                features = self.get_feature(STrack.xywh2tlbr(det_high[:, :4]), ori_img)
+                features = self.get_feature(det_high[:, :4], ori_img)
                 # detections: List[Strack]
-                D_high = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format, feature=feature)
-                                for (cls, xywh, score, feature) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4], features)]
+                D_high = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format, feature=feature)
+                                for (cls, tlbr, score, feature) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4], features)]
             else:
-                D_high = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
+                D_high = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
         else:
             D_high = []
 
         if det_low.shape[0] > 0:
-            D_low = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]
+            D_low = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]  # build from the low-score split, not det_high
         else:
             D_low = []
 
 
@@ -61,7 +61,6 @@ def get_buffer_bbox(self, level=1, bbox=None):
             buffer_bbox = bbox + np.array([-b*bbox[2], -b*bbox[3], 2*b*bbox[2], 2*b*bbox[3]])
         return np.maximum(0.0, buffer_bbox)
 
-
     @property
     def tlbr(self):
         ret = self.origin_bbox_buffer[-1].copy()
@@ -152,6 +151,18 @@ def update(self, new_track, frame_id):
 
         self.time_since_update = 0
 
+
+    @staticmethod
+    def tlbr2tlwh(tlbr):
+        """
+        Convert [x1, y1, x2, y2] box(es), shape (4,) or (..., 4), to [x1, y1, w, h]; returns a new array, input untouched.
+        """
+        result = np.asarray(tlbr).copy()
+        result[..., 2] -= result[..., 0]  # last-axis indexing handles a single box or a batch
+        result[..., 3] -= result[..., 1]
+
+        return result
+
     @staticmethod
     def xywh2tlbr(xywh):
         """
@@ -226,25 +237,11 @@ def update(self, det_results, ori_img):
         """step 1. filter results and init tracks"""
         det_results = det_results[det_results[:, 4] > self.det_thresh]
 
-        # convert the scale to origin size
-        # NOTE: yolo v7 origin out format: [xc, yc, w, h, conf, cls0_conf, cls1_conf, ..., clsn_conf]
-        # TODO: check here, if nesscessary use two ratio
-        img_h, img_w = ori_img.shape[0], ori_img.shape[1]
-        ratio = [img_h / self.model_img_size[0], img_w / self.model_img_size[1]]  # usually > 1
-        det_results[:, 0], det_results[:, 2] =  det_results[:, 0]*ratio[1], det_results[:, 2]*ratio[1]
-        det_results[:, 1], det_results[:, 3] =  det_results[:, 1]*ratio[0], det_results[:, 3]*ratio[0]
-
         if det_results.shape[0] > 0:
-            if self.NMS:
-                # TODO: Note nms need tlbr format
-                bbox_temp = C_BIoUSTrack.xywh2tlbr(det_results[:, :4])
-                nms_indices = nms(torch.from_numpy(bbox_temp), torch.from_numpy(det_results[:, 4]), 
-                                self.opts.nms_thresh)
-                det_results = det_results[nms_indices.numpy()]
 
             # detections: List[Strack]
-            detections = [C_BIoUSTrack(cls, C_BIoUSTrack.xywh2tlwh(xywh), score)
-                            for (cls, xywh, score) in zip(det_results[:, -1], det_results[:, :4], det_results[:, 4])]
+            detections = [C_BIoUSTrack(cls, C_BIoUSTrack.tlbr2tlwh(tlbr), score)
+                            for (cls, tlbr, score) in zip(det_results[:, -1], det_results[:, :4], det_results[:, 4])]
 
         else:
             detections = []
 
@@ -176,42 +176,29 @@ def update(self, det_results, ori_img):
         lost_stracks = []           # The tracks which are not obtained in the current frame but are not removed.(Lost for some time lesser than the threshold for removing)
         removed_stracks = []
 
-        # convert the scale to origin size
-        # NOTE: yolo v7 origin out format: [xc, yc, w, h, conf, cls0_conf, cls1_conf, ..., clsn_conf]
-        # TODO: check here, if nesscessary use two ratio
-        img_h, img_w = ori_img.shape[0], ori_img.shape[1]
-        ratio = [img_h / self.model_img_size[0], img_w / self.model_img_size[1]]  # usually > 1
-        det_results[:, 0], det_results[:, 2] =  det_results[:, 0]*ratio[1], det_results[:, 2]*ratio[1]
-        det_results[:, 1], det_results[:, 3] =  det_results[:, 1]*ratio[0], det_results[:, 3]*ratio[0]
-
         """step 1. filter results and init tracks"""
 
         # filter small area bboxs
         if self.filter_small_area:  
             small_indicies = det_results[:, 2]*det_results[:, 3] > 50
             det_results = det_results[small_indicies]
 
-        # run NMS
-        if self.NMS:
-            # NOTE: Note nms need tlbr format
-            nms_indices = nms(torch.from_numpy(STrack.xywh2tlbr(det_results[:, :4])), torch.from_numpy(det_results[:, 4]), 
-                            self.opts.nms_thresh)
-            det_results = det_results[nms_indices.numpy()]
 
         # cal high and low indicies
         det_high_indicies = det_results[:, 4] >= self.det_thresh
         det_low_indicies = np.logical_and(np.logical_not(det_high_indicies), det_results[:, 4] > self.low_conf_thresh)
 
         det_high, det_low = det_results[det_high_indicies], det_results[det_low_indicies]
+
         if det_high.shape[0] > 0:
-            D_high = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                        for (cls, xywh, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
+            D_high = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                        for (cls, tlbr, score) in zip(det_high[:, -1], det_high[:, :4], det_high[:, 4])]
         else:
             D_high = []
 
         if det_low.shape[0] > 0:
-            D_low = [STrack(cls, STrack.xywh2tlwh(xywh), score, kalman_format=self.opts.kalman_format)
-                            for (cls, xywh, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]
+            D_low = [STrack(cls, STrack.tlbr2tlwh(tlbr), score, kalman_format=self.opts.kalman_format)
+                            for (cls, tlbr, score) in zip(det_low[:, -1], det_low[:, :4], det_low[:, 4])]
         else:
             D_low = []