guoqing backup

王庆刚
2024-10-04 12:12:44 +08:00
parent 09e92d63b3
commit 390c5d2d94
37 changed files with 1409 additions and 219 deletions


@@ -127,6 +127,176 @@ def init_trackers(tracker_yaml = None, bs=1):
    return trackers
@smart_inference_mode()
def yolo_resnet_tracker(
        weights=ROOT / 'yolov5s.pt',  # model path or triton URL
        source=ROOT / 'data/images',  # file/dir/URL/glob/screen/0(webcam)
        project=ROOT / 'runs/detect',  # save results to project/name
        name='exp',  # save results to project/name
        save_dir='',
        tracker_yaml="./tracking/trackers/cfg/botsort.yaml",
        imgsz=(640, 640),  # inference size (height, width)
        conf_thres=0.25,  # confidence threshold
        iou_thres=0.45,  # NMS IOU threshold
        max_det=1000,  # maximum detections per image
        device='',  # cuda device, i.e. 0 or 0,1,2,3 or cpu
        view_img=False,  # show results
        save_txt=False,  # save results to *.txt
        save_csv=False,  # save results in CSV format
        save_conf=False,  # save confidences in --save-txt labels
        save_crop=False,  # save cropped prediction boxes
        nosave=False,  # do not save images/videos
        classes=None,  # filter by class: --class 0, or --class 0 2 3
        agnostic_nms=False,  # class-agnostic NMS
        augment=False,  # augmented inference
        visualize=False,  # visualize features
        update=False,  # update all models
        exist_ok=False,  # existing project/name ok, do not increment
        line_thickness=3,  # bounding box thickness (pixels)
        hide_labels=False,  # hide labels
        hide_conf=False,  # hide confidences
        half=False,  # use FP16 half-precision inference
        dnn=False,  # use OpenCV DNN for ONNX inference
        vid_stride=1,  # video frame-rate stride
        data=ROOT / 'data/coco128.yaml',  # dataset.yaml path
):
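    '''Run YOLOv5 detection plus tracker.update() tracking and ReID feature
    extraction over a video/image source. Returns TracksDict, holding per-frame
    {"imgs", "boxes", "feats"} dicts keyed by box index, plus the accumulated
    "TrackBoxes" array. (Summary docstring added for clarity.)
    '''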
    source = str(source)
    save_img = not nosave and not source.endswith('.txt')  # save inference images

    # Load model
    device = select_device(device)
    model = DetectMultiBackend(weights, device=device, dnn=dnn, data=data, fp16=half)
    stride, names, pt = model.stride, model.names, model.pt
    imgsz = check_img_size(imgsz, s=stride)  # check image size

    # Dataloader
    bs = 1  # batch_size
    dataset = LoadImages(source, img_size=imgsz, stride=stride, auto=pt, vid_stride=vid_stride)
    vid_path, vid_writer = [None] * bs, [None] * bs

    # Run inference
    model.warmup(imgsz=(1 if pt or model.triton else bs, 3, *imgsz))  # warmup
    tracker = init_trackers(tracker_yaml, bs)[0]
    dt = (Profile(), Profile(), Profile())

    track_boxes = np.empty((0, 9), dtype=np.float32)
    TracksDict = {}
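    # Accumulator layout (per the tracks docstring inside the loop): each row is
    # [x1, y1, x2, y2, track_id, score, cls, frame_index, box_index];
    # TracksDict maps "frame_{N}" to the imgs/boxes/feats dicts built per frame.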
    for path, im, im0s, vid_cap, s in dataset:
        with dt[0]:
            im = torch.from_numpy(im).to(model.device)
            im = im.half() if model.fp16 else im.float()  # uint8 to fp16/32
            im /= 255  # 0 - 255 to 0.0 - 1.0
            if len(im.shape) == 3:
                im = im[None]  # expand for batch dim

        # Inference
        with dt[1]:
            visualize = increment_path(save_dir / Path(path).stem, mkdir=True) if visualize else False
            pred = model(im, augment=augment, visualize=visualize)

        # NMS
        with dt[2]:
            pred = non_max_suppression(pred, conf_thres, iou_thres, classes, agnostic_nms, max_det=max_det)
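        # pred is now a list with one (n, 6) tensor per image:
        # [x1, y1, x2, y2, conf, cls], in letterboxed-input pixel coordinates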
        # Process predictions
        for i, det in enumerate(pred):  # per image
            im0 = im0s.copy()
            save_path = str(save_dir / Path(path).name)  # im.jpg
            s += '%gx%g ' % im.shape[2:]  # print string
            annotator = Annotator(im0.copy(), line_width=line_thickness, example=str(names))
            if len(det):
                # Rescale boxes from img_size to im0 size
                det[:, :4] = scale_boxes(im.shape[2:], det[:, :4], im0.shape).round()
                # det = det.cpu().numpy()

                ## ================================================================ written by WQG
                '''tracks: [x1, y1, x2, y2, track_id, score, cls, frame_index, box_index]
                             0   1   2   3      4       5     6       7           8
                frame_index can also be replaced by the video's frame ID; box_index stays unchanged.
                '''
                det_tracking = Boxes(det, im0.shape).cpu().numpy()
                tracks = tracker.update(det_tracking, im0)
                if len(tracks) == 0:
                    continue
                tracks[:, 7] = dataset.frame

                '''================== 1. Store the dets/subimgs/features dicts =============='''
                imgs, features = inference_image(im0, tracks)
                # TrackerFeats = np.concatenate([TrackerFeats, features], axis=0)

                imgdict = {}
                boxdict = {}
                featdict = {}
                for ii, bid in enumerate(tracks[:, 8]):
                    imgdict[int(bid)] = imgs[ii]
                    boxdict[int(bid)] = tracks[ii, :]
                    featdict[int(bid)] = features[ii, :]
                TracksDict[f"frame_{int(dataset.frame)}"] = {"imgs": imgdict, "boxes": boxdict, "feats": featdict}
                track_boxes = np.concatenate([track_boxes, tracks], axis=0)
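                # Illustrative read-back of what was just stored (box_id is hypothetical):
                #   entry = TracksDict[f"frame_{int(dataset.frame)}"]
                #   crop = entry["imgs"][box_id]    # cropped sub-image for that box
                #   feat = entry["feats"][box_id]   # its ReID feature vector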
                '''================== 2. Extract gesture positions ==================='''
                for *xyxy, id, conf, cls, fid, bid in reversed(tracks):
                    name = ('' if id == -1 else f'id:{int(id)} ') + names[int(cls)]
                    label = None if hide_labels else (name if hide_conf else f'{name} {conf:.2f}')
                    if id >= 0 and cls == 0:
                        color = colors(int(cls), True)
                    elif id >= 0 and cls != 0:
                        color = colors(int(id), True)
                    else:
                        color = colors(19, True)  # 19 is the last entry in the palette
                    annotator.box_label(xyxy, label, color=color)
            # Save results (image and video with tracking)
            im0 = annotator.result()
            save_path_img, ext = os.path.splitext(save_path)
            if save_img:
                if dataset.mode == 'image':
                    imgpath = save_path_img + f"_{dataset.count}.png"  # likely intended dataset.count; f"_{dataset}" embedded the object repr
                else:
                    imgpath = save_path_img + f"_{dataset.frame}.png"
                cv2.imwrite(str(imgpath), im0)  # cv2.imwrite expects a str path, not a Path

                if vid_path[i] != save_path:  # new video
                    vid_path[i] = save_path
                    if isinstance(vid_writer[i], cv2.VideoWriter):
                        vid_writer[i].release()  # release previous video writer
                    if vid_cap:  # video
                        fps = vid_cap.get(cv2.CAP_PROP_FPS)
                        w = int(vid_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
                        h = int(vid_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
                    else:  # stream
                        fps, w, h = 30, im0.shape[1], im0.shape[0]
                    save_path = str(Path(save_path).with_suffix('.mp4'))  # force *.mp4 suffix on results videos
                    vid_writer[i] = cv2.VideoWriter(save_path, cv2.VideoWriter_fourcc(*'mp4v'), fps, (w, h))
                vid_writer[i].write(im0)

        # Print time (inference-only)
        LOGGER.info(f"{s}{'' if len(det) else '(no detections), '}{dt[1].dt * 1E3:.1f}ms")
    ## track_boxes: Array, [x1, y1, x2, y2, track_id, score, cls, frame_index, box_index]
    TracksDict.update({"TrackBoxes": track_boxes})
    return TracksDict
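# Minimal usage sketch for yolo_resnet_tracker (the weights/paths below are
# assumptions for illustration, not part of this commit):
#   tracks_dict = yolo_resnet_tracker(
#       weights=ROOT / 'ckpts/best_cls10_0906.pt',
#       source=r"D:/datasets/ym/videos/example.mp4",
#       save_dir=Path('runs/detect/exp'),
#   )
#   all_boxes = tracks_dict["TrackBoxes"]  # (N, 9) array accumulated over the run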
@smart_inference_mode()
def run(
        weights=ROOT / 'yolov5s.pt',  # model path or triton URL
@@ -438,7 +608,8 @@ def run(
def parse_opt():
    modelpath = ROOT / 'ckpts/best_yolov5m_250000.pt'  # 'ckpts/best_15000_0908.pt', 'ckpts/yolov5s.pt', 'ckpts/best_20000_cls30.pt'
    modelpath = ROOT / 'ckpts/best_cls10_0906.pt'  # 'ckpts/best_15000_0908.pt', 'ckpts/yolov5s.pt', 'ckpts/best_20000_cls30.pt', 'best_yolov5m_250000'
    '''datapath is a directory of video files or a single video file'''
    datapath = r"D:/datasets/ym/videos/标记视频/"  # ROOT/'data/videos', ROOT/'data/images'
@@ -522,7 +693,8 @@ def main_loop(opt):
# p = r"D:\datasets\ym\videos\标记视频"
# p = r"D:\datasets\ym\实验室测试"
# p = r"D:\datasets\ym\永辉双摄视频\新建文件夹"
p = r"\\192.168.1.28\share\测试_202406\0723\0723_2\20240723-112522_"
# p = r"\\192.168.1.28\share\测试_202406\0723\0723_2\20240723-112522_"
p = r"D:\datasets\ym\联华中环"
k = 0
if os.path.isdir(p):