视频转化为3D模式，形成的火柴人动画与原视频差得太远

问题遇到的现象和发生背景

我使用这个软件自带的坤坤视频就没有问题，但是用自己的视频来跑就生成失败了

问题相关代码，请勿粘贴截图

运行结果及报错内容

我的解答思路和尝试过的方法

我想要达到的结果

import time

import cv2
import matplotlib.pyplot as plt
import numpy as np
from matplotlib.animation import FuncAnimation, writers
from matplotlib.backends.backend_agg import FigureCanvasAgg as FigureCanvas
from mpl_toolkits.mplot3d import Axes3D
from tqdm import tqdm

from common.utils import read_video


def ckpt_time(ckpt=None, display=0, desc=''):
    """Start a timing checkpoint, or measure the time elapsed since one.

    The clock is sampled exactly once per call, so the printed value, the
    returned elapsed time and the returned new checkpoint all agree.

    :param ckpt: a timestamp previously returned by this function (or by
                 ``time.time()``). Any falsy value (``None``, ``0``) means
                 "no checkpoint yet".
    :param display: when truthy, print the elapsed time prefixed by ``desc``.
    :param desc: label prepended to the printed message.
    :return: the current timestamp when ``ckpt`` is falsy; otherwise the tuple
             ``(elapsed_seconds, current_timestamp)``.
    """
    now = time.time()
    if not ckpt:
        return now

    elapsed = now - float(ckpt)
    if display:
        print(desc + ' consume time {:0.4f}'.format(elapsed))
    return elapsed, now


def set_equal_aspect(ax, data):
    """
    Plot the eight corners of a cube enclosing the data as white points, with the
    aim of keeping the 3D axis at an equal aspect ratio.
    :param ax: 3D axis; only its ``plot(xs, ys, zs, fmt)`` method is used
    :param data: array whose last dimension holds x, y, z at indices 0, 1, 2
    """
    xs, ys, zs = data[..., 0], data[..., 1], data[..., 2]
    x_lo, x_hi = xs.min(), xs.max()
    y_lo, y_hi = ys.min(), ys.max()
    z_lo, z_hi = zs.min(), zs.max()

    # Half the edge length of the cube: half of the largest extent over the three axes.
    half_edge = 0.5 * np.array([x_hi - x_lo, y_hi - y_lo, z_hi - z_lo]).max()

    # signs[k] holds the -1/+1 offset along axis k for each of the 8 cube corners.
    signs = np.mgrid[-1:2:2, -1:2:2, -1:2:2]
    corner_x = half_edge * signs[0].flatten() + 0.5 * (x_hi + x_lo)
    corner_y = half_edge * signs[1].flatten() + 0.5 * (y_hi + y_lo)
    corner_z = half_edge * signs[2].flatten() + 0.5 * (z_hi + z_lo)

    # One plot call per corner, each drawing a single point with the 'w' format.
    for corner in zip(corner_x, corner_y, corner_z):
        ax.plot([corner[0]], [corner[1]], [corner[2]], 'w')


def downsample_tensor(X, factor):
    """
    Average every ``factor`` consecutive entries along the first axis.

    Trailing entries that do not fill a complete group of ``factor`` are dropped.
    :param X: array to downsample along axis 0
    :param factor: number of consecutive entries merged into one
    :return: array with first dimension ``X.shape[0] // factor``; the remaining
             dimensions are unchanged
    """
    # Largest multiple of `factor` that fits into the first dimension.
    usable = X.shape[0] // factor * factor
    # Split axis 0 into (groups, factor); -1 lets numpy infer the group count.
    grouped_shape = (-1, factor) + tuple(X.shape[1:])
    grouped = X[:usable].reshape(grouped_shape)
    # Averaging over axis 1 collapses each group of `factor` entries into one.
    return np.mean(grouped, axis=1)

# fps: frames per second; bitrate: encoder bit rate; azim: azimuth of the 3D view; viewport: size of the blank input frames
def render_animation(keypoints, poses, skeleton, fps, bitrate, azim, output, viewport,
                     limit=-1, downsample=1, size=6, input_video_path=None, input_video_skip=0):
    """
    Render the input frames side by side with one 3D skeleton per entry of ``poses``
    and save the animation to ``output``.

    Supported output targets:
     -- 'filename.mp4': saved through matplotlib's 'ffmpeg' writer.
     -- 'filename.gif': saved through matplotlib's 'imagemagick' writer at dpi=60.

    :param keypoints: per-frame 2D keypoints, scattered over the input image
                      (presumably shaped (frames, joints, 2) -- TODO confirm)
    :param poses: mapping of subplot title -> 3D pose array indexed as
                  ``[frame, joint, xyz]``; joint 0 is used as the trajectory
    :param skeleton: object providing ``parents()`` and ``joints_right()``
    :param fps: frame rate of the output; divided by ``downsample`` when > 1
    :param bitrate: bit rate passed to the ffmpeg writer
    :param azim: azimuth passed to ``view_init`` of every 3D axis
    :param output: output file name ending in '.mp4' or '.gif'
    :param viewport: only used without an input video; blank frames are created
                     with shape ``(viewport[1], viewport[0])``
    :param limit: maximum number of frames to render; values < 1 mean all frames
    :param downsample: temporal averaging factor applied when > 1
    :param size: height of the figure in inches; each panel is ``size`` wide
    :param input_video_path: video to show in the input panel, or None for blank frames
    :param input_video_skip: forwarded to ``read_video`` as ``skip``
    :raises ValueError: if ``output`` does not end in '.mp4' or '.gif'
    """
    # Reject unsupported targets up front, before decoding video or creating a figure.
    if not output.endswith(('.mp4', '.gif')):
        raise ValueError('Unsupported output format (only .mp4 and .gif are supported)')

    plt.ioff()  # turn matplotlib interactive mode off while rendering
    # One panel for the input plus one per pose set; every panel is size x size inches.
    fig = plt.figure(figsize=(size * (1 + len(poses)), size))
    ax_in = fig.add_subplot(1, 1 + len(poses), 1)
    ax_in.get_xaxis().set_visible(False)
    ax_in.get_yaxis().set_visible(False)
    ax_in.set_axis_off()
    ax_in.set_title('Input')

    # Touch Axes3D so the import is actually referenced.
    # NOTE(review): presumably the import is what registers the '3d' projection on
    # older matplotlib releases -- confirm before removing.
    _ = Axes3D.__class__.__name__

    ax_3d = []
    lines_3d = []
    trajectories = []
    radius = 1.7
    for index, (title, data) in enumerate(poses.items()):
        # 3D panel for this pose set
        ax = fig.add_subplot(1, 1 + len(poses), index + 2, projection='3d')
        ax.view_init(elev=15., azim=azim)
        # Every axis spans a range of `radius`, so the view volume is a cube.
        ax.set_xlim3d([-radius / 2, radius / 2])
        ax.set_zlim3d([0, radius])
        ax.set_ylim3d([-radius / 2, radius / 2])
        # ax.set_aspect('equal')
        ax.set_xticklabels([])
        ax.set_yticklabels([])
        ax.set_zticklabels([])
        ax.dist = 12.5
        # lxy add
        ax.set_xlabel('X Label')
        ax.set_ylabel('Y Label')
        ax.set_zlabel('Z Label')
        ax.set_title(title)  # , pad=35
        ax_3d.append(ax)
        lines_3d.append([])
        # x/y of joint 0 for every frame; used to keep the view centred on the subject.
        trajectories.append(data[:, 0, [0, 1]])
    poses = list(poses.values())

    # Decode video
    if input_video_path is None:
        # Blank background: one all-zero uint8 frame per keypoint frame.
        all_frames = np.zeros((keypoints.shape[0], viewport[1], viewport[0]), dtype='uint8')
    else:
        # Load every frame yielded by read_video.
        all_frames = []
        for f in read_video(input_video_path, fps=None, skip=input_video_skip):
            all_frames.append(f)

        # Do not keep more frames than there are keypoint frames.
        effective_length = min(keypoints.shape[0], len(all_frames))
        all_frames = all_frames[:effective_length]

    if downsample > 1:
        keypoints = downsample_tensor(keypoints, downsample)
        # Averaging produces floats; convert back to uint8 image data.
        all_frames = downsample_tensor(np.array(all_frames), downsample).astype('uint8')
        for idx in range(len(poses)):
            poses[idx] = downsample_tensor(poses[idx], downsample)
            trajectories[idx] = downsample_tensor(trajectories[idx], downsample)
        fps /= downsample

    initialized = False
    image = None
    points = None

    if limit < 1:
        limit = len(all_frames)
    else:
        limit = min(limit, len(all_frames))

    parents = skeleton.parents()
    pbar = tqdm(total=limit)  # progress bar, advanced once per rendered frame

    def update_video(i):
        nonlocal initialized, image, points

        # Re-centre the x/y limits of every 3D panel on the trajectory for frame i.
        for n, ax in enumerate(ax_3d):
            ax.set_xlim3d([-radius / 2 + trajectories[n][i, 0], radius / 2 + trajectories[n][i, 0]])
            ax.set_ylim3d([-radius / 2 + trajectories[n][i, 1], radius / 2 + trajectories[n][i, 1]])

        # The 2D skeleton overlay on the input image is disabled; only the
        # keypoint scatter is drawn on top of the frame.
        if not initialized:
            # First frame: create the artists.
            image = ax_in.imshow(all_frames[i], aspect='equal')

            for j, j_parent in enumerate(parents):
                if j_parent == -1:
                    continue

                col = 'red' if j in skeleton.joints_right() else 'black'
                for n, ax in enumerate(ax_3d):
                    pos = poses[n][i]
                    lines_3d[n].append(ax.plot([pos[j, 0], pos[j_parent, 0]],
                                               [pos[j, 1], pos[j_parent, 1]],
                                               [pos[j, 2], pos[j_parent, 2]], zdir='z', c=col))

            points = ax_in.scatter(*keypoints[i].T, 5, color='red', edgecolors='white', zorder=10)

            initialized = True
        else:
            # Later frames: update the existing artists in place.
            image.set_data(all_frames[i])

            for j, j_parent in enumerate(parents):
                if j_parent == -1:
                    continue

                # Bones were appended in joint order, skipping joints whose parent is -1.
                # NOTE(review): indexing with j - 1 assumes joint 0 is the only such
                # joint -- confirm against the skeleton definition.
                for n, ax in enumerate(ax_3d):
                    pos = poses[n][i]
                    lines_3d[n][j - 1][0].set_xdata([pos[j, 0], pos[j_parent, 0]])
                    lines_3d[n][j - 1][0].set_ydata([pos[j, 1], pos[j_parent, 1]])
                    lines_3d[n][j - 1][0].set_3d_properties([pos[j, 2], pos[j_parent, 2]], zdir='z')

            points.set_offsets(keypoints[i])

        pbar.update()

    # fig.tight_layout()

    anim = FuncAnimation(fig, update_video, frames=limit, interval=1000.0 / fps, repeat=False)
    try:
        if output.endswith('.mp4'):
            Writer = writers['ffmpeg']
            writer = Writer(fps=fps, metadata={}, bitrate=bitrate)
            anim.save(output, writer=writer)
        else:
            # Only '.gif' can reach this branch thanks to the check at the top.
            anim.save(output, dpi=60, writer='imagemagick')
    finally:
        # Release the progress bar and this figure even when saving fails.
        pbar.close()
        plt.close(fig)


def render_animation_test(keypoints, poses, skeleton, fps, bitrate, azim, output, viewport, limit=-1, downsample=1,
                          size=6, input_video_frame=None, input_video_skip=0, num=None):
    """
    Render one frame: the input image on the left and the last 'Reconstruction'
    pose as a 3D skeleton on the right. The result is shown in an OpenCV window
    named 'im' and returned.

    Only ``poses``, ``skeleton``, ``azim`` and ``input_video_frame`` are used; the
    remaining parameters are accepted but ignored by this function.

    :param poses: mapping containing the key 'Reconstruction'; its last entry is
                  drawn and indexed as ``[joint, xyz]``
    :param skeleton: object providing ``parents()`` and ``joints_right()``
    :param azim: azimuth passed to ``view_init`` of the 3D axis
    :param input_video_frame: image shown in the left panel
    :return: the rendered figure as a writable uint8 array of shape
             (height, width, 3) in RGB channel order
    """
    t0 = ckpt_time()
    fig = plt.figure(figsize=(12, 6))
    try:
        canvas = FigureCanvas(fig)
        ax_in = fig.add_subplot(121)
        ax_in.imshow(input_video_frame)
        # 3D
        ax = fig.add_subplot(122, projection='3d')
        ax.view_init(elev=15., azim=azim)
        # Every axis spans a range of `radius`, so the view volume is a cube.
        radius = 1.7
        ax.set_xlim3d([-radius / 2, radius / 2])
        ax.set_zlim3d([0, radius])
        ax.set_ylim3d([-radius / 2, radius / 2])
        try:
            ax.set_aspect('equal')
        except NotImplementedError:
            # Some Matplotlib releases refuse 'equal' on 3D axes. The limits above
            # already cover equal ranges on all three axes, so carry on without it.
            pass
        # Hide the tick labels
        ax.set_xticklabels([])
        ax.set_yticklabels([])
        ax.set_zticklabels([])
        ax.dist = 7.5

        # lxy add
        ax.set_xlabel('X Label')
        ax.set_ylabel('Y Label')
        ax.set_zlabel('Z Label')

        # array([-1,  0,  1,  2,  0,  4,  5,  0,  7,  8,  9,  8, 11, 12,  8, 14, 15])
        parents = skeleton.parents()

        pos = poses['Reconstruction'][-1]
        # Timing checkpoints; nothing is printed because display defaults to 0.
        _, t1 = ckpt_time(t0, desc='1 ')
        for j, j_parent in enumerate(parents):
            if j_parent == -1:
                continue

            col = 'red' if j in skeleton.joints_right() else 'black'
            # Draw the bone between joint j and its parent.
            ax.plot([pos[j, 0], pos[j_parent, 0]],
                    [pos[j, 1], pos[j_parent, 1]],
                    [pos[j, 2], pos[j_parent, 2]], zdir='z', c=col)

        #  plt.savefig('test/3Dimage_{}.png'.format(1000+num))
        width, height = fig.get_size_inches() * fig.get_dpi()
        _, t2 = ckpt_time(t1, desc='2 ')
        canvas.draw()  # draw the canvas, cache the renderer
        # np.frombuffer replaces the deprecated binary mode of np.fromstring; the
        # copy keeps the returned array writable, as np.fromstring's result was.
        # NOTE(review): tostring_rgb is deprecated in recent Matplotlib releases in
        # favour of buffer_rgba -- confirm against the installed version.
        image = np.frombuffer(canvas.tostring_rgb(), dtype='uint8').reshape(int(height), int(width), 3).copy()
        # cv2.imshow interprets 3-channel data as BGR, so convert for the preview
        # only; the returned image stays RGB.
        cv2.imshow('im', cv2.cvtColor(image, cv2.COLOR_RGB2BGR))
        cv2.waitKey(5)
        ckpt_time(t2, desc='3 ')
        return image
    finally:
        # A new figure is created on every call; close it so figures do not pile up.
        plt.close(fig)

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

报告相同问题？

关注问题

A - 火柴棒等式：答案错误 c++
2022-01-10 22:58

回答 1 已采纳我的想法是，等式必须要用掉4根，整体火柴数量要-4，剩下的需要完成一个等式，即三个数字的加法满足自减4根的火柴数量，那么穷举所有的次数就能得出答案，不过得满足火柴总数相等以及等式成立
三堆火柴-博弈-笔试题 c# javascript typescript 有问必答
2021-07-09 22:14

回答 1 已采纳你题目的解答代码如下：（如有帮助，望采纳！谢谢! 点击我这个回答右上方的【采纳】按钮） var arr = [3,5,7]; var player = 1; while (true) { va
c语言火柴方程问题，萌新求教 c语言
2020-12-14 18:46

回答 1 已采纳 if(inout==1 || input ==2 ||input ==3) return (4-input); else return (input %2);
独立游戏人：像素风格游戏制作分享(转)
2019-10-04 07:18

dinghui1875的博客独立游戏人：像素风格游戏制作分享 ...我也想做像素风格的游戏，在经过一段时间的研究学习后，有了些心得，现在把我博客里的一篇文章贴出来，权当抛砖引玉，希望对同样喜欢像素风格，计划做像素游戏的人有所帮助。...
新Nim游戏
2017-02-11 15:08

回答 1 已采纳 http://blog.csdn.net/cyc66/article/details/48103337
想问下这个为什么会报错 eclipse 有问必答
2022-07-06 13:16

回答 3 已采纳 package com; interface fire{ public void Fireup(); //{ //System.out.println("点燃火柴"); //} } publi
关于#c语言#的问题：员工婚姻信息表，年份不知道为什么会输出成这样 c语言
2023-02-17 21:21

回答 1 已采纳年份打印有问题是因为下面这个 union 使用错了。 union marritalState //定义婚姻状况公用体类型 { int marryFlag; //婚姻状况标志，1 表示未婚，2
Unity RPG 黑暗之光问题记录上（1-63 地形场景角色选择行走相机跟随、旋转、缩放任务系统面板栏背包系统状态系统）
2021-06-26 19:48

weixin_39538253的博客 001 游戏预览和介绍职业选择鼠标点击移动旋转缩放药品装备任务NPC 状态装备技能存档 002 导入场景资源，搭建场景 3方资源：RPG NGUI StandarAssets 进去关闭自动生成（问题）模型贴图丢失改变Shader...
关于#c++#的问题：火柴棍拼数0-9的拼法，给定五位整数n需要用多少根火柴棍拼的出来 c++
2021-10-05 00:02

回答 1 已采纳 #include<bits/stdc++.h> using namespace std; int num[10001]={6,2,5,5,4,5,6,3,7,6}; int a[4],n,
火柴问题Matches
2016-12-30 14:05

回答 1 已采纳 http://poj.org/problem?id=3932
求各位大佬来讲解，救救孩子吧 c++ c语言有问必答
2021-05-22 22:02

回答 2 已采纳代码如下，如有帮助，请采纳一下，谢谢。 #include <stdio.h> #include <map> using namespace std; int main()
为没有历史的互联网留下历史——闪客帝国回忆录
2017-08-09 14:31

weixin_34372728的博客这意味着早期基于Flash开发的众多内容如游戏、网站、视频等内容，都将彻底消失并逐渐被遗忘。在网络带宽不高、流媒体尚未普及的互联网初期，体积很小且容易上手制作的Flash曾被很多国内网友“玩出花”。十几年前的...
华为hcip中级数通考几门?考试形式是什么? 网络协议网络安全
2022-09-12 21:49

回答 2 已采纳华为hcip认证数通考三门，分别为：HCIP-Routing & Switching-IERS、HCIP-Routing & Switching-IENP、HCIP-Routing & Switchi
CoreAnimation
2018-01-27 11:06

yz_Blog的博客一、图层的树状结构 ...你可能认为它只是用来做动画的，但实际上它是从一个叫做Layer Kit这么一个不怎么和动画有关的名字演变而来，所以做动画这只是Core Animation特性的冰山一角。 Core Animation是一个复合引擎
入局智能健身镜，小度破圈进行时
2021-12-10 20:51

Alter1230的博客如果是在2020年以前，这样的消息注定不会被太多人关注，彼时主打语音交互的智能助手还处于风口期，新品牌、新产品、新合作层出不穷。可当智能音箱在新冠疫情的影响下告别了高速增长，当外部舆论纷纷期待赛道玩家们下...
小学综合素质知识点
2022-02-13 16:13

m0_45903117的博客 &lt小于号 &gt大于号古典密码： 1nv151bl3m3554g3 知识点：教师职业道德修养含义一、教师职业道德修养的含义：是将教师职业道德要求转化为自己的信念并付诸行动的活动，简单说，是一种自我锻炼、自我改造、自我...
英语基础词汇
2022-02-19 11:52

神也小忐忑的博客凶残的人举止粗鲁的人 beat [biːt] n.敲打;(心脏等)跳动 v.打败;(心脏等)跳动 beach [biːtʃ] n.海滩湖滩河滩 blind [blaɪnd] a.盲的，瞎的；盲目的 vt.使失明 n.百叶窗 blouse [blaʊz] n.女衬衣，短上衣，...
java统一复习
2020-11-03 17:37

&曙光&的博客 5目录目录１基础篇４一、JDK常用的包４二、 Get和Post的区别４ ...十一、 Page和PageContext的区别７ ...七、 Forword(请求转发)与Redirect(重定向) ６八、JQurey总结６九、 XML和Json的特点６ .
2020 android面试题答案
2020-05-04 18:12

卖火柴的小男孩2020的博客解析：Java中方法调用的目标方法在Class文件里面都是常量池中的符号引用，在类加载的解析阶段，会将其中的一部分符号引用转化为直接引用。这种解析的前提是：方法在程序真正运行之前就有一个可以确定的调用版本，...
电脑史话
2014-11-16 16:38

hunterzone的博客 ”（英特尔华裔副总裁虞有澄语）据说，IBM公司后来围绕PC机的各项开发，投入的力量逐步达到450人，英特尔公司也组成“特殊客户部”为PC机供应高质量的芯片。　根据协定，微软公司应该为PC机提供包括BA
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
系统已结题 4月11日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
修改了问题 4月3日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 4月3日

悬赏问题

¥15 两台交换机分别是trunk接口和access接口为何无法通信，通信过程是如何？
¥15 C语言使用vscode编码错误
¥15 用KSV5转成本时，如何不生成那笔中间凭证
¥20 ensp怎么配置让PC1和PC2通讯上
¥50 有没有适合匹配类似图中的运动规律的图像处理算法
¥15 dnat基础问题,本机发出,别人返回的包,不能命中
¥15 请各位帮我看看是哪里出了问题
¥15 vs2019的js智能提示
¥15 关于#开发语言#的问题：FDTD建模问题图中代码没有报错，但是模型却变透明了
¥15 uniapp的h5项目写一个抽奖动画

视频转化为3D模式，形成的火柴人动画与原视频差得太远

问题遇到的现象和发生背景

问题相关代码，请勿粘贴截图

运行结果及报错内容

我的解答思路和尝试过的方法

我想要达到的结果

0条回答 默认 最新

问题事件

悬赏问题

0条回答默认最新