运行deepsort的track遇到的问题

运行yolov5+deepsort的时候得到deepsort的运动轨迹是这样的

但是使用yolov5的识别结果是

两者是哪里不匹配？问题可能出现在哪里呢？
附上deepsort代码

import sys
sys.path.insert(0, './yolov5')

from yolov5.utils.datasets import LoadImages, LoadStreams
from yolov5.utils.general import check_img_size, non_max_suppression, scale_coords
from yolov5.utils.torch_utils import select_device, time_synchronized
from deep_sort_pytorch.utils.parser import get_config
from deep_sort_pytorch.deep_sort import DeepSort
import argparse
import os
import platform
import shutil
import time
from pathlib import Path
import cv2
import torch
import torch.backends.cudnn as cudnn
import numpy as np


# Three per-channel multipliers; compute_color_for_labels combines them with a
# label value to derive a repeatable colour for that label.
palette = (2 ** 11 - 1, 2 ** 15 - 1, 2 ** 20 - 1)


def bbox_rel(*xyxy):
    """Convert two opposite box corners into a centre/size box.

    The first four positional arguments are read as ``x, y, x, y`` corner
    coordinates; each must expose ``.item()`` (e.g. a 0-d tensor). The corner
    order does not matter because min/abs are used.

    Returns:
        tuple: ``(x_center, y_center, width, height)`` in the same units as
        the inputs.
    """
    xa, ya, xb, yb = (xyxy[k].item() for k in range(4))
    width = abs(xa - xb)
    height = abs(ya - yb)
    # Centre = smallest coordinate plus half the extent.
    center_x = min([xa, xb]) + width / 2
    center_y = min([ya, yb]) + height / 2
    return center_x, center_y, width, height


def compute_color_for_labels(label):
    """
    Map a label value to a fixed 3-tuple of ints, one per ``palette`` entry.

    The same label always yields the same tuple; each component is reduced
    modulo 255.
    """
    factor = label ** 2 - label + 1
    return tuple(int((channel * factor) % 255) for channel in palette)


def draw_boxes(img, bbox, identities=None, offset=(0, 0)):
    """Draw one rectangle plus a filled numeric label tag per box onto ``img``.

    Args:
        img: image passed straight to the cv2 drawing calls (modified in place).
        bbox: iterable of 4-value boxes, unpacked as ``x1, y1, x2, y2``.
        identities: optional per-box ids, indexed in step with ``bbox``;
            when None every box is labelled 0.
        offset: ``(dx, dy)`` added to every corner before drawing.

    Returns:
        The same ``img`` object.
    """
    for idx, box in enumerate(bbox):
        dx, dy = offset[0], offset[1]
        x1, y1, x2, y2 = (int(v) for v in box)
        x1, x2 = x1 + dx, x2 + dx
        y1, y2 = y1 + dy, y2 + dy

        # The colour is derived from the id, so it is fixed per id.
        track_id = 0 if identities is None else int(identities[idx])
        color = compute_color_for_labels(track_id)
        label = '{}{:d}'.format("", track_id)
        text_w, text_h = cv2.getTextSize(label, cv2.FONT_HERSHEY_PLAIN, 2, 2)[0]

        # Box outline, then a filled tag at the top-left corner holding the id.
        cv2.rectangle(img, (x1, y1), (x2, y2), color, 3)
        cv2.rectangle(img, (x1, y1), (x1 + text_w + 3, y1 + text_h + 4), color, -1)
        cv2.putText(img, label, (x1, y1 + text_h + 4),
                    cv2.FONT_HERSHEY_PLAIN, 2, [255, 255, 255], 2)
    return img


# xyxy2tlwh helper; tracking code bases usually ship their own copy of this.
def xyxy2tlwh(x):
    '''
    Convert rows of (x1, y1, x2, y2) into
    (top left x, top left y, width, height).

    Accepts a 2-D torch.Tensor or a numpy-compatible array and returns a new
    array of the same shape and dtype; columns beyond the fourth stay zero.
    '''
    if isinstance(x, torch.Tensor):
        out = torch.zeros_like(x)
    else:
        out = np.zeros_like(x)
    # The top-left corner is copied unchanged.
    out[:, 0] = x[:, 0]
    out[:, 1] = x[:, 1]
    # Extents are the corner differences.
    out[:, 2] = x[:, 2] - x[:, 0]
    out[:, 3] = x[:, 3] - x[:, 1]
    return out

def _draw_trajectories(frame, trajectories):
    """Draw every stored track as line segments joining consecutive centres."""
    for points in trajectories.values():
        for start, end in zip(points, points[1:]):
            cv2.line(frame, tuple(map(int, start)), tuple(map(int, end)),
                     (255, 0, 0), thickness=2, lineType=8)


def _append_mot_rows(txt_path, frame_idx, outputs):
    """Append one MOT-style row per tracked box to ``txt_path``.

    Each ``outputs`` row is read as ``[x1, y1, x2, y2, ..., track_id]``; the
    row written is ``frame, id, left, top, width, height, -1, -1, -1, -1``.
    """
    with open(txt_path, 'a') as f:
        for output in outputs:
            bbox_left = output[0]
            bbox_top = output[1]
            # Width/height are corner differences, not the raw x2/y2 values.
            bbox_w = output[2] - output[0]
            bbox_h = output[3] - output[1]
            identity = output[-1]
            f.write(('%g ' * 10 + '\n') % (frame_idx, identity, bbox_left,
                                           bbox_top, bbox_w, bbox_h, -1, -1, -1, -1))  # label format


def detect(opt, save_img=False):
    """Run YOLOv5 detection and DeepSORT tracking over ``opt.source``.

    For every frame the detections are rescaled to the original frame size,
    passed to DeepSORT, and the resulting tracks are drawn (boxes, ids and
    centre-point trajectories), optionally written to ``results.txt`` and
    saved as image/video into ``opt.output``.

    Args:
        opt: options object; the attributes read are ``output``, ``source``,
            ``weights``, ``view_img``, ``save_txt``, ``img_size``,
            ``config_deepsort``, ``device``, ``augment``, ``conf_thres``,
            ``iou_thres``, ``classes``, ``agnostic_nms`` and ``fourcc``.
        save_img: whether to save annotated frames; forced to True for
            non-stream sources.

    Raises:
        StopIteration: when 'q' is pressed in the preview window.

    Note:
        ``opt.output`` is deleted and recreated on every call, and the
        preview window is always shown (``view_img`` is forced to True).
    """
    out, source, weights, view_img, save_txt, imgsz = \
        opt.output, opt.source, opt.weights, opt.view_img, opt.save_txt, opt.img_size
    webcam = source == '0' or source.startswith(
        ('rtsp', 'http')) or source.endswith('.txt')

    # initialize deepsort
    cfg = get_config()
    cfg.merge_from_file(opt.config_deepsort)
    # NOTE(review): the re-id checkpoint path is machine-specific; consider
    # moving it into the DeepSORT config file. The raw string keeps the
    # backslashes literal without relying on invalid escape sequences.
    deepsort = DeepSort(r'D:\yolo\yolov5\yolov5-master\Yolov5_DeepSort_Pytorch\deep_sort_pytorch\deep_sort\deep\checkpoint/ckpt5.t7',
                        max_dist=cfg.DEEPSORT.MAX_DIST, min_confidence=cfg.DEEPSORT.MIN_CONFIDENCE,
                        nms_max_overlap=cfg.DEEPSORT.NMS_MAX_OVERLAP, max_iou_distance=cfg.DEEPSORT.MAX_IOU_DISTANCE,
                        max_age=cfg.DEEPSORT.MAX_AGE, n_init=cfg.DEEPSORT.N_INIT, nn_budget=cfg.DEEPSORT.NN_BUDGET,
                        use_cuda=True)

    # Initialize
    device = select_device(opt.device)
    if os.path.exists(out):
        shutil.rmtree(out)  # delete output folder
    os.makedirs(out)  # make new output folder
    half = device.type != 'cpu'  # half precision only supported on CUDA

    # Load model. Mapping storages onto the selected device lets a checkpoint
    # saved on GPU load on a CPU-only machine.
    model = torch.load(weights, map_location=device)[
        'model'].float()  # load to FP32
    model.to(device).eval()
    if half:
        model.half()  # to FP16

    # Set Dataloader
    vid_path, vid_writer = None, None
    view_img = True
    if webcam:
        cudnn.benchmark = True  # set True to speed up constant image size inference
        dataset = LoadStreams(source, img_size=imgsz)
    else:
        save_img = True
        dataset = LoadImages(source, img_size=imgsz)

    # Get names and colors
    names = model.module.names if hasattr(model, 'module') else model.names

    # Run inference
    t0 = time.time()
    img = torch.zeros((1, 3, imgsz, imgsz), device=device)  # init img
    # run once
    _ = model(img.half() if half else img) if device.type != 'cpu' else None

    save_path = str(Path(out))
    txt_path = str(Path(out)) + '/results.txt'
    dict_box = dict()  # track id -> list of [x_center, y_center] over time

    try:
        for frame_idx, (path, img, im0s, vid_cap) in enumerate(dataset):
            img = torch.from_numpy(img).to(device)
            img = img.half() if half else img.float()  # uint8 to fp16/32
            img /= 255.0  # 0 - 255 to 0.0 - 1.0
            if img.ndimension() == 3:
                img = img.unsqueeze(0)

            # Inference
            t1 = time_synchronized()
            pred = model(img, augment=opt.augment)[0]

            # Apply NMS
            pred = non_max_suppression(
                pred, opt.conf_thres, opt.iou_thres, classes=opt.classes, agnostic=opt.agnostic_nms)
            t2 = time_synchronized()

            # Process detections
            for i, det in enumerate(pred):  # detections per image
                if webcam:  # batch_size >= 1
                    p, s, im0 = path[i], '%g: ' % i, im0s[i].copy()
                else:
                    p, s, im0 = path, '', im0s

                s += '%gx%g ' % img.shape[2:]  # print string
                save_path = str(Path(out) / Path(p).name)

                if det is not None and len(det):
                    # Rescale boxes from the network input size to the im0
                    # size. Without this the boxes handed to DeepSORT (which
                    # receives im0) and drawn on im0 are in the wrong
                    # coordinate frame.
                    det[:, :4] = scale_coords(
                        img.shape[2:], det[:, :4], im0.shape).round()

                    # Print results
                    for c in det[:, -1].unique():
                        n = (det[:, -1] == c).sum()  # detections per class
                        s += '%g %ss, ' % (n, names[int(c)])  # add to string

                    bbox_xywh = []
                    confs = []

                    # Adapt detections to deep sort input format
                    for *xyxy, conf, cls in det:
                        x_c, y_c, bbox_w, bbox_h = bbox_rel(*xyxy)
                        bbox_xywh.append([x_c, y_c, bbox_w, bbox_h])
                        confs.append([conf.item()])

                    xywhs = torch.Tensor(bbox_xywh)
                    confss = torch.Tensor(confs)

                    # Pass detections to deepsort
                    outputs = deepsort.update(xywhs, confss, im0)
                    # outputs = [x1, y1, x2, y2, track_id]
                    if len(outputs) > 0:
                        bbox_xyxy = outputs[:, :4]  # first four columns: box corners
                        identities = outputs[:, -1]  # last column: track id
                        box_tlwh = xyxy2tlwh(bbox_xyxy)
                        # Record the centre of every tracked box under its id.
                        for j in range(len(box_tlwh)):
                            x_center = box_tlwh[j][0] + box_tlwh[j][2] / 2
                            y_center = box_tlwh[j][1] + box_tlwh[j][3] / 2
                            track_id = int(outputs[j][-1])
                            dict_box.setdefault(track_id, []).append(
                                [x_center, y_center])
                        # Trajectories: connect the stored centres of each id
                        # in order.
                        if frame_idx > 2:
                            _draw_trajectories(im0, dict_box)

                        # draw boxes for visualization
                        draw_boxes(im0, bbox_xyxy, identities)

                    # Write MOT compliant results to file
                    if save_txt and len(outputs) != 0:
                        _append_mot_rows(txt_path, frame_idx, outputs)

                else:
                    deepsort.increment_ages()

                # Print time (inference + NMS)
                print('%sDone. (%.3fs)' % (s, t2 - t1))

                # Stream results
                if view_img:
                    cv2.imshow(p, im0)
                    if cv2.waitKey(1) == ord('q'):  # q to quit
                        raise StopIteration

                # Save results (image with detections)
                if save_img:
                    print('saving img!')
                    if dataset.mode == 'images':
                        cv2.imwrite(save_path, im0)
                    else:
                        print('saving video!')
                        if vid_path != save_path:  # new video
                            vid_path = save_path
                            if isinstance(vid_writer, cv2.VideoWriter):
                                vid_writer.release()  # release previous video writer

                            fps = vid_cap.get(cv2.CAP_PROP_FPS)
                            w = int(vid_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
                            h = int(vid_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
                            vid_writer = cv2.VideoWriter(
                                save_path, cv2.VideoWriter_fourcc(*opt.fourcc), fps, (w, h))
                        vid_writer.write(im0)
    finally:
        # Release the last writer, also when the user quits with 'q'.
        if isinstance(vid_writer, cv2.VideoWriter):
            vid_writer.release()

    if save_txt or save_img:
        print('Results saved to %s' % os.getcwd() + os.sep + out)
        if platform.system() == 'Darwin':  # MacOS
            # Argument list instead of a shell string: paths may contain spaces.
            import subprocess
            subprocess.run(['open', save_path], check=False)

    print('Done. (%.3fs)' % (time.time() - t0))


if __name__ == '__main__':
    # Command-line entry point: parse the options, then run detect() with
    # gradient tracking disabled.
    parser = argparse.ArgumentParser()
    # Raw strings keep the Windows backslashes literal; the non-raw originals
    # relied on invalid escape sequences, which newer Python versions warn about.
    parser.add_argument('--weights', type=str,
                        default=r'D:\yolo\yolov5\yolov5-master/runs/train\exp15\weights/best.pt', help='model.pt path')
    # file/folder, 0 for webcam
    parser.add_argument('--source', type=str,
                        default=r'D:\yolo\yolov5\pic\mouse white.mov', help='source')
    parser.add_argument('--output', type=str, default='inference/output',
                        help='output folder')  # output folder
    parser.add_argument('--img-size', type=int, default=640,
                        help='inference size (pixels)')
    parser.add_argument('--conf-thres', type=float,
                        default=0.4, help='object confidence threshold')
    parser.add_argument('--iou-thres', type=float,
                        default=0.5, help='IOU threshold for NMS')
    parser.add_argument('--fourcc', type=str, default='mp4v',
                        help='output video codec (verify ffmpeg support)')
    parser.add_argument('--device', default='',
                        help='cuda device, i.e. 0 or 0,1,2,3 or cpu')
    parser.add_argument('--view-img', action='store_true',
                        help='display results')
    # The default stays truthy (results are always written), but is now a
    # real bool instead of the string "true".
    parser.add_argument('--save-txt', default=True, action='store_true',
                        help='save results to *.txt')
    # class 0 is person
    parser.add_argument('--classes', nargs='+', type=int,
                        default=[0], help='filter by class')
    parser.add_argument('--agnostic-nms', action='store_true',
                        help='class-agnostic NMS')
    parser.add_argument('--augment', action='store_true',
                        help='augmented inference')
    parser.add_argument("--config_deepsort", type=str,
                        default="deep_sort_pytorch/configs/deep_sort.yaml")
    args = parser.parse_args()
    args.img_size = check_img_size(args.img_size)
    print(args)

    with torch.no_grad():
        detect(args)

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

5条回答默认最新

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
专家-赤兔[在线] 全栈领域优质创作者 2024-05-06 14:34
关注
引自免费微信小程序：皆我百晓生

在您提供的代码中，detect 函数负责处理图像并应用DeepSort进行目标追踪。看起来您遇到了一些问题，导致跟踪结果不理想。首先，我们需要确定问题出在哪里。

根据您提供的描述，运动轨迹可能存在问题。让我们逐段检查代码，找出可能导致问题的部分，并提供相应的修改建议。

compute_color_for_labels 和 draw_boxes 函数：这些函数与运动轨迹无关，因此它们不是问题所在。
xyxy2tlwh 函数：这个函数用于将边界框从xyxy格式（左上角、右下角）转换为tlwh格式（左上角、宽度、高度），看起来没有问题。
detect 函数：
在计算跟踪结果时，您使用了dict_box字典来存储每个ID对应的中心点。这一步应该没问题。
然后，您在循环内通过cv2.line绘制轨迹线。这里可能出现的问题是：每次迭代都重新开始绘制线，而不是连续绘制。为了修复这个问题，您需要在循环外部初始化一个空列表，在每次迭代中添加新的中心点，然后在该次迭代的点全部收集完之后统一绘制所有线。

下面是针对以上分析对代码做出的修改：

def detect(opt, save_img=False):
    ...
    dict_box = {}  # 初始化字典
    points_to_connect = []  # 新增用于保存需要连接的点的列表
    ...
    for frame_idx, ...:
        ...
        if len(outputs) > 0:
            ...
            for j in range(len(box_xywh)):
                ...
                center = [x_center, y_center]
                dict_box.setdefault(id, []).append(center)
                points_to_connect.extend([(center, id)])  # 将每个中心点和其对应ID作为元组添加到列表中
            if frame_idx > 2:  # 避免在前三帧绘制线，因为此时还没有足够的点
                for point, id in points_to_connect:  # 连接所有的点
                    for a in range(len(dict_box[id]) - 1):
                        start = dict_box[id][a]
                        end = dict_box[id][a + 1]
                        cv2.line(im0, tuple(map(int, start)), tuple(map(int, end)), (255, 0, 0), thickness=2, lineType=8)
            points_to_connect.clear()  # 清空列表，准备下一轮迭代
        ...

这样应该可以解决运动轨迹的问题。注意，上述代码是在原始代码的基础上进行了修改。将这些更改应用于您的源代码，并再次运行程序，看看是否解决了轨迹显示的问题。如果有其他问题，或者您需要进一步的帮助，请随时告诉我。
解决无用
评论打赏
分享
举报编辑记录

评论

按下Enter换行，Ctrl+Enter发表内容

报告相同问题？

关注问题

FlatBuffers的多语言集成问题 c++
2018-11-06 23:06

回答 2 已采纳 Not sure if this the entire problem, but a quick glance at convertStreamMessage shows a major prob
如何获取Koreography Track中的列表 unity 游戏引擎
2023-03-09 18:08

回答 1 已采纳直接读取文件，其实是一个xml的文件，里面就有。
Go中的追加行为不一致？
2019-02-11 01:35

回答 1 已采纳 I has nothing to do with append. You are doing a DFS-traversal of a binary tree, the order is cal
用 YOLO v5+DeepSORT，打造实时多目标跟踪模型
2021-08-20 16:00

AI科技大本营的博客相关论文： https://arxiv.org/pdf/1602.00763.pdf 2、DeepSORT DeepSORT 是 SORT 的升级版，它整合了外观信息 (appearance information) 从而提高 SORT 的性能，这使得我们在遇到较长时间的遮挡时，也能够正常跟踪...
Gitlab CI-Auto DevOps作业失败，无法为Go项目选择构建包？
2018-11-08 19:45

回答 1 已采纳 From the AutoDevops documentation: Auto Build creates a build of the application in one of two
如何保持死去的去例行程序的计数？
2018-03-13 20:43

回答 1 已采纳 Use deferred function that will recover from panic. func count() { err := recover() if er
hadoop运行jar包的那些事 hadoop java mapreduce
2023-03-22 00:06

回答 2 已采纳 1.、程序执行出现Error: java.lang.NullPointerException空指针异常，确保java程序的正确。变量什么的使用前先实例化声明，不要有数组越界之类的现象。检查程序。2、执
【深度学习】用 YOLO v5+DeepSORT，打造实时多目标跟踪模型
2021-08-05 11:59

风度78的博客相关论文： https://arxiv.org/pdf/1602.00763.pdf 2、DeepSORT DeepSORT 是 SORT 的升级版，它整合了外观信息 (appearance information) 从而提高 SORT 的性能，这使得我们在遇到较长时间的遮挡时，也能够正常跟踪...
没有报错，但是运行不了 python
2021-10-24 17:26

回答 1 已采纳你现在连程序入口都没有，怎么运行啊
Snowball Edge-Golang中的aws-sdk-go软件包-无法连接到S3
2018-03-14 17:36

回答 1 已采纳 Snowball Edge is a very different beast than is AWS S3. In addition to the access key and secret a
在应用程序中处理NULL值并发送到数据库
2018-02-01 16:19

回答 1 已采纳 CONCERN 1 is easily remedied by adding a getter method for your fields func (l Location) GetTitle
编程面试中需要了解的5件事
2020-08-08 00:18

cumi7754的博客如果您正在使用某种编程语言的深奥特性，那么在编写完全部内容之后就可以对其进行解释。在编码会话中这意味着什么 (What this means in a coding session) If you have already established some way of solving ...
Dependency-Track页面Risk core列没有值，怎么解决 web安全性能优化系统安全
2021-11-29 10:25

回答 1 已采纳 I expect to see vulnerable components but I don’tMost common reason: You have yet to enable the Sona
python开发中级_针对中级Python开发人员的13个项目构想
2020-07-13 22:25

cumei1658的博客更好地理解编程概念：您将学习更好地编写代码，并理解诸如设计模式和面向对象编程之类的概念。体验完整的软件开发生命周期：您将学习如何在编写代码之前进行计划，管理编码过程以及更新软件。 There is a lot to...
语音转换成文本技术实现_职业转换者指南，帮助您实现梦想的技术工作
2020-08-13 15:43

cumian8165的博客鉴于我以前没有使用过机器人技术或电子产品的经验，因此我着手制造了可以在我的客厅中运行的深度学习/自动驾驶机器人汽车DeepPiCar 。 One month later, after I successfully built the self-driving car, I ...
mcu比较器技巧和诀窍_如何准备技术面试-技巧和窍门，以帮助您表现最好
2020-08-13 05:22

cumi6497的博客最重要的是，许多使用白板面试的地方还提出了一些面试问题，坦率地说，这些问题对99％的编程工作毫无价值。这些是可怕的计算机科学算法：反转二叉树，在图形中找到最短路径等。 The problem with these questions ...
切换到Android吗？这是您需要知道的一切
2020-09-14 09:40

culinqian4296的博客 For Google searches, I’d recommend going with something like “How to on .” So, for example, “How to change the wallpaper on Galaxy S9 Android 8.0.” 现在，您知道遇到问题时要寻找的内容。...
华夏常春藤_我如何在没有常春藤大学学位的情况下从微软，亚马逊和Twitter获取报价...
2020-07-20 12:15

cumian8165的博客要解决此问题，我通过VPN运行了脚本，并设置了一个计时器，该计时器每隔几分钟左右就会暂停脚本。它并不完美，但是效果很好。 At the end of it, I collected about 500 emails from around San Francisco, ...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 5月6日

悬赏问题

¥15 treelib库有读取树数据方法吗？
¥15 咨询一个PYTHON的问题
¥15 机器学习建模调参，roc评价指标
¥15 RCS plot 包内置数据集使用时报错，如何解决？
¥15 keil+mspm0g3507+二维总线舵机
¥15 如何用wireshark分析找出url接口和param参数
¥15 有谁知道这是阿里云那个应用的域名吗，怎么调用？
¥30 正则表达式的一些问题
¥15 C#如何使用不需要安装 Microsoft Excel 的机器上的方法或者库实现：将指定Excel区域导出为图片（例如A1:AO50）
¥15 虚拟机只能接收不能发送

运行deepsort的track遇到的问题

5条回答 默认 最新

问题事件

悬赏问题

5条回答默认最新