Python 代码，请问为什么会出现下面的报错？应该如何解决？

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import cv2
import numpy as np
from cnocr import CnOcr
import pandas as pd
from pandas import DataFrame
import os
import onnx
# Size of the invoice image generated later on, set according to the standard
# VAT invoice layout of 240mm x 140mm (i.e. 10 pixels per millimetre).
height_resize = 1400
width_resize = 2400


def resizeImg(image, height=height_resize):
    """Scale ``image`` to the requested height, keeping its aspect ratio.

    Args:
        image: Image array; only the first two entries of ``image.shape``
            (rows, columns) are read here.
        height: Target height in pixels. Defaults to the module-level
            ``height_resize``.

    Returns:
        The resized image as returned by ``cv2.resize``.
    """
    src_h, src_w = image.shape[:2]
    scale = height / src_h
    # cv2.resize expects the target size as (width, height).
    target_size = (int(src_w * scale), int(height))
    return cv2.resize(image, target_size)


def getCanny(image):
    """Return a dilated Canny edge map of ``image``.

    The image is blurred with a 3x3 Gaussian kernel, passed through the Canny
    detector (thresholds 60 and 240, aperture 3) and dilated once with a 3x3
    kernel so that edges are more likely to form closed outlines.

    Args:
        image: Input image accepted by ``cv2.GaussianBlur``.

    Returns:
        The dilated edge image produced by ``cv2.dilate``.
    """
    # The sigmas are passed by keyword: the fourth positional parameter of
    # cv2.GaussianBlur is ``dst`` (the output array), not ``sigmaY``.
    blurred = cv2.GaussianBlur(image, (3, 3), sigmaX=2, sigmaY=2)
    edges = cv2.Canny(blurred, 60, 240, apertureSize=3)
    # Dilate so that small gaps in the detected edges get closed.
    kernel = np.ones((3, 3), np.uint8)
    return cv2.dilate(edges, kernel, iterations=1)


def findMaxContour(image):
    """Find the external contour with the largest area.

    Args:
        image: Binary edge image passed to ``cv2.findContours``.

    Returns:
        A ``(max_contour, max_area)`` tuple. When no contour has an area
        greater than zero, ``max_contour`` is an empty list and ``max_area``
        is ``0.0``.
    """
    found = cv2.findContours(image, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
    # OpenCV 3.x returns (image, contours, hierarchy) while 2.x/4.x return
    # (contours, hierarchy); the contours are second-to-last in both layouts.
    contours = found[-2]

    max_area = 0.0
    max_contour = []
    for contour in contours:
        area = cv2.contourArea(contour)
        # Strict comparison: zero-area contours are never selected.
        if area > max_area:
            max_area = area
            max_contour = contour
    return max_contour, max_area


def getBoxPoint(contour):
    """Approximate the convex hull of ``contour`` with a polygon.

    The approximation tolerance is 2% of the closed perimeter of the original
    contour.

    Args:
        contour: Contour as accepted by ``cv2.convexHull``.

    Returns:
        The polygon vertices reshaped to ``(number_of_vertices, 2)``.
    """
    tolerance = 0.02 * cv2.arcLength(contour, True)
    convex_outline = cv2.convexHull(contour)
    vertices = cv2.approxPolyDP(convex_outline, tolerance, True)
    vertex_count = len(vertices)
    return vertices.reshape((vertex_count, 2))


def adapPoint(box, pro):
    """Map points found on the resized image back to the original image.

    Args:
        box: Array of point coordinates.
        pro: Scale factor that was applied to the original image; the
            coordinates are divided by it unless it equals 1.0.

    Returns:
        The rescaled coordinates with their fractional part truncated.
    """
    rescaled = box if pro == 1.0 else box / pro
    return np.trunc(rescaled)


def orderPoints(pts):
    """Order quadrilateral vertices as [top-left, top-right, bottom-right, bottom-left].

    The top-left / bottom-right corners are the points with the smallest /
    largest ``x + y``; the top-right / bottom-left corners are the points with
    the smallest / largest ``y - x``.

    Args:
        pts: Array of 2-D points, one ``(x, y)`` pair per row.

    Returns:
        A ``(4, 2)`` float32 array with the four selected corners.
    """
    coord_sum = pts.sum(axis=1)
    coord_diff = np.diff(pts, axis=1)
    corners = (
        pts[np.argmin(coord_sum)],   # top-left
        pts[np.argmin(coord_diff)],  # top-right
        pts[np.argmax(coord_sum)],   # bottom-right
        pts[np.argmax(coord_diff)],  # bottom-left
    )
    rect = np.zeros((4, 2), dtype="float32")
    for slot, corner in enumerate(corners):
        rect[slot] = corner
    return rect


def pointDistance(a, b):
    """Return the Euclidean distance between ``a`` and ``b``, truncated to an int.

    Used to derive the width and height of the rectified image.
    """
    offset = a - b
    squared_length = np.sum(np.square(offset))
    return int(np.sqrt(squared_length))


def warpImage(image, box):
    """Apply a perspective transform that maps ``box`` onto an upright rectangle.

    The output width is the distance between ``box[0]`` and ``box[1]``; the
    output height is the distance between ``box[1]`` and ``box[2]``.

    Args:
        image: Source image.
        box: Four source points; the destination corners are laid out as
            top-left, top-right, bottom-right, bottom-left, so ``box`` is
            expected in that same order.

    Returns:
        The warped image of size ``(width, height)``.
    """
    out_w = pointDistance(box[0], box[1])
    out_h = pointDistance(box[1], box[2])
    right, bottom = out_w - 1, out_h - 1
    target_corners = np.array(
        [[0, 0], [right, 0], [right, bottom], [0, bottom]],
        dtype='float32',
    )
    transform = cv2.getPerspectiveTransform(box, target_corners)
    return cv2.warpPerspective(image, transform, (out_w, out_h))


def imagePreProcessing(path):
    """Load an invoice photo and return a rectified, fixed-size image of it.

    Steps: read the image, detect edges on a resized copy, take the largest
    external contour, fit a polygon to its convex hull, map the vertices back
    to the original resolution, apply a perspective transform and finally
    resize the result to ``(width_resize, height_resize)``.

    Args:
        path: Path of the image file to process.

    Returns:
        The rectified image resized to ``width_resize`` x ``height_resize``.

    Raises:
        FileNotFoundError: If ``path`` is not an existing file.
        ValueError: If the file cannot be decoded as an image, or if no
            contour with a positive area is found in it.
    """
    if not os.path.isfile(path):
        raise FileNotFoundError('Image file not found: {}'.format(path))
    image = cv2.imread(path)
    # cv2.imread signals failure by returning None instead of raising.
    if image is None:
        raise ValueError('Could not decode image file: {}'.format(path))

    # Edge detection, contour search and vertex fitting run on a resized copy;
    # ``ratio`` is used afterwards to map the vertices back to the original.
    ratio = height_resize / image.shape[0]
    img = resizeImg(image)
    binary_img = getCanny(img)
    max_contour, _ = findMaxContour(binary_img)
    if len(max_contour) == 0:
        raise ValueError(
            'No contour with a positive area found in: {}'.format(path))
    boxes = getBoxPoint(max_contour)
    boxes = adapPoint(boxes, ratio)
    boxes = orderPoints(boxes)

    # Perspective transform on the original (full resolution) image.
    warped = warpImage(image, boxes)

    # Bring the result to the fixed final size.
    size = (width_resize, height_resize)
    return cv2.resize(warped, size, interpolation=cv2.INTER_CUBIC)


def cropImage_test(img, crop_range, filename='Undefined'):
    """Crop a region, show it in a window and save it to disk (testing aid).

    Intended for the testing stage only; regular processing uses
    ``cropImage``, which neither displays nor saves anything.

    Args:
        img: Source image array.
        crop_range: ``(xpos, ypos, width, height)`` of the region.
        filename: Window title and output file name. When left at
            ``'Undefined'`` a name is built from the crop coordinates.

    Returns:
        The cropped region.
    """
    left, top, span_w, span_h = crop_range
    region = img[top:top + span_h, left:left + span_w]
    if filename == 'Undefined':
        # No name given: derive one from the crop coordinates.
        filename = 'crop-' + '-'.join(
            str(value) for value in (left, top, span_w, span_h)) + '.jpg'
    cv2.imshow(filename, region)
    # imencode + tofile is used instead of cv2.imwrite because imwrite
    # garbles file names that contain Chinese characters.
    encoded = cv2.imencode('.jpg', region)[1]
    encoded.tofile(filename)
    return region


def cropImage(img, crop_range):
    """Return the sub-image of ``img`` described by ``crop_range``.

    Args:
        img: Source image array indexed as ``img[row, column]``.
        crop_range: ``(xpos, ypos, width, height)`` of the region.

    Returns:
        The slice ``img[ypos:ypos + height, xpos:xpos + width]``.
    """
    left, top, span_w, span_h = crop_range
    rows = slice(top, top + span_h)
    cols = slice(left, left + span_w)
    return img[rows, cols]


def cropOCR(crop, ocrType):
    """Recognise the single line of text contained in ``crop``.

    Args:
        crop: Cropped image region holding one line of text.
        ocrType: Which module-level recogniser to use: 0 -> ``ocr`` (mixed
            characters), 1 -> ``ocr_numbers`` (digits only),
            2 -> ``ocr_UpperSerial`` (serial numbers).

    Returns:
        The recognised text as a single string.

    Raises:
        ValueError: If ``ocrType`` is not 0, 1 or 2.
    """
    if ocrType == 0:
        recognizer = ocr
    elif ocrType == 1:
        recognizer = ocr_numbers
    elif ocrType == 2:
        recognizer = ocr_UpperSerial
    else:
        # Previously an unknown type fell through and failed later with an
        # UnboundLocalError; fail early with a clear message instead.
        raise ValueError(
            'Unknown ocrType: {!r} (expected 0, 1 or 2)'.format(ocrType))

    result = recognizer.ocr_for_single_line(crop)

    # NOTE(review): the original code assumes a list of characters. Newer
    # cnocr releases appear to return a dict with a 'text' entry, or a
    # (chars, score) tuple - confirm against the installed cnocr version.
    if isinstance(result, dict):
        text = result.get('text', '')
        return text if isinstance(text, str) else ''.join(text)
    if isinstance(result, tuple) and result and isinstance(result[0], (list, tuple)):
        return ''.join(result[0])
    return ''.join(result)


if __name__ == '__main__':
    # Instantiate one CnOcr object per purpose. cropOCR looks these up as
    # module-level names, so they must keep exactly these names.
    ocr = CnOcr(name='')  # mixed characters
    ocr_numbers = CnOcr(name='numbers', cand_alphabet='0123456789')  # digits only
    ocr_UpperSerial = CnOcr(name='UpperSerial',
                            cand_alphabet='0123456789ABCDEFGHIJKLMNPQRSTUVWXYZ')  # serial numbers: upper-case letters (no O) and digits

    # Regions to crop from the rectified image - field names
    crop_range_list_name = ['发票代码', '发票号码', '开票日期',
                            '校验码', '销售方名称', '销售方纳税人识别号',
                            '销售方地址电话', '销售方开户行及账号', '价税合计',
                            '备注']

    # Regions to crop from the rectified image - [xpos, ypos, width, height]
    crop_range_list_data = [[1870, 40, 380, 38], [1867, 104, 380, 38], [1866, 166, 380, 50],
                            [1867, 230, 450, 50], [421, 1046, 933, 46], [419, 1091, 933, 48],
                            [420, 1145, 933, 47], [421, 1193, 933, 40], [1892, 976, 414, 48],
                            [1455, 1045, 325, 38]]

    # Regions to crop from the rectified image - OCR type per field,
    # 0: mixed characters, 1: digits only, 2: serial number
    crop_range_list_type = [1, 1, 0,
                            1, 0, 2,
                            0, 0, 0,
                            0]

    # Pre-process (rectify and resize) the image
    path = 'test.png'
    warped = imagePreProcessing(path)

    # Save the pre-processed image (testing aid)
    cv2.imwrite('result.jpg', warped)

    # Run OCR on every region and collect the results in text_ocr
    text_ocr = []
    for field_name, crop_range, ocr_type in zip(crop_range_list_name,
                                                crop_range_list_data,
                                                crop_range_list_type):
        crop = cropImage(warped, crop_range)
        crop_text = cropOCR(crop, ocr_type)
        # Invoices never contain a lower-case "o"; any occurrence is a misread zero.
        crop_text = crop_text.replace('o', '0')
        print(field_name, ':', crop_text)
        text_ocr.append(crop_text)

    # Results are stored per year and month; derive the workbook name from
    # the recognised invoice date.
    date_text = text_ocr[2]
    if '年' not in date_text:
        # Without the year marker the split below would fail with a bare
        # IndexError that says nothing about the OCR result.
        raise ValueError(
            'Cannot derive the workbook name from recognised date {!r}'.format(date_text))
    date_temp = date_text.split('年')
    year_num = date_temp[0]
    month_num = date_temp[1].split('月')[0]
    filename = year_num + '-' + month_num + '.xlsx'

    # Create the workbook with just the header row if it does not exist yet
    if not os.path.exists(filename):
        df = pd.DataFrame({name: [] for name in crop_range_list_name})
        df.to_excel(filename, index=False)

    # Read every cell as text: the rows are written as strings, so comparing
    # against int(...) never matched (and raised ValueError whenever the
    # recognised number contained a non-digit character).
    data = pd.read_excel(filename, dtype=str)
    known_numbers = {str(value).strip()
                     for value in data['发票号码'].dropna().tolist()}
    if text_ocr[1].strip() not in known_numbers:
        new_line_num = data.shape[0]
        data.loc[new_line_num] = text_ocr
        data.to_excel(filename, index=False, header=True)
    else:
        print(path, 'is already in', filename, '!')

    cv2.waitKey(0)

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

报告相同问题？

关注问题

为什么代码都可以运行了，还显示绿色，然后报错？ r语言有问必答
2022-02-24 10:31

回答 3 已采纳 Python 是解释型语言，你写了错误的语法也能运行，并不像 C 语言那样有语法错误就拒绝给你编译。至于为什么会显示绿色，是因为你前面的引号用法错误，导致后面的代码其实都在引号里，是字符串的一部分。
网上找了个用python做五子棋游戏的代码但是运行后无效果请问有哪里出错了吗，代码如下。 pygame python 开发语言有问必答
2022-04-02 20:14

回答 2 已采纳 你函数都没有调用啊，应该有一个主要函数来调用吧？你代码是不是不全啊？
运用python语言编写下面程序 python
2021-11-26 16:27

回答 1 已采纳 def isPrime(x): if x < 2: return 0 for i in range(2, x): if x % i == 0:
Python3.5以上版本lxml导入etree报错的解决方案
2020-12-25 18:57

在python中安装了lxml-4.2.1，在使用时发现导入etree时IDE中报错Unresolved reference 其实发现，不影响使用，可以正常运行，对于我这种要刨根问底的人不搞明白怎么能罢休了，要保证代码不红就研究了下源码，通过...
为什么我的函数命令突然执行不了了呀？ python 开发语言
2022-01-25 13:52

回答 3 已采纳换个别的名字？
python中下载tesserocr报错 python
2022-09-11 12:26

回答 2 已采纳给你找了一篇非常好的博客，你可以看看是否有帮助，链接：Python安装tesserocr遇到的坑
两列时间序列数据怎么用apriori算法做关联分析呢？(语言-python) python 数据分析算法
2022-06-01 14:01

回答 3 已采纳原始数据—>滑动窗口L=10截取原始数据得到N个子序列—>线性拟合—>标准化斜率—>子序列符号化处理—>Apriori算法我觉得这个说的挺清楚的啊，关联算法本身解决的是各
Python使用pickle模块存储数据报错解决示例代码
2020-12-25 02:08

本文研究的主要是Python使用pickle模块存储数据报错解决方法，以代码的形式展示，具体如下。首先来了解下pickle模块 pickle提供了一个简单的持久化功能。可以将对象以文件的形式存放在磁盘上。 pickle模块只能在...
python中，strip()用来做什么，errmsg是关键字还是函数，用来做什么 python 开发语言
2021-12-17 17:25

回答 2 已采纳 strip用来删除开头、结尾的字符，类似C#语言里的trim函数strip函数可以带参数，比如写a.strip(b)，那么把a开头和结尾包含字符串b的部分全部删除（重复多次也一并删除）如果不填参数，默
如何写高质量的提问和回答？问答团队
2021-06-03 11:39

回答 2 已采纳不支持给代码，但还是一大堆的人给代码。很多还是学生，为了考试或者什么求代码，这种给代码就是害人家！
attribute error (dataframe) python 开发语言
2022-10-08 18:56

回答 1 已采纳 xlsx.interrows 改为 xlsx.iterrows
Python代码报错看不懂？记住这20个报错提示单词轻松解决bug
2022-07-15 12:11

小詹学 Python的博客 indexerror: list index out of range索引错误：列表超出索引范围（检查列表是否为空） 1) list [lɪst] 列表 2) index [ˈɪndeks] 索引 3) error [ˈerər] 错误 4) range [reɪndʒ] 范围 5. typeerror: must be...
根据id删除出现异常不知如何解决
2012-11-25 02:02

回答 1 已采纳 hibernateTemplate.delete(s),s不应该是id的值，delete（Object entity），你可以根据id值将要删除的实体查询出来，然后再删除
Python2包含中文报错的解决方法
2021-01-21 17:41

最近在工作中遇到一个问题，通过查找相关的解决方法终于解决，下面话不多说了，来一起看看详细的介绍吧命令行会出现如下错误信息 SyntaxError: Non-ASCII character ‘\xe8’ in file Python注释.py on line 1, ...
Python的10个常见报错和解决方法
2024-08-14 08:41

途途途途的博客想象一下，写信时漏掉了某个单词，这会让收信人不明白你的意思，编程也是一样，任何语法错误都会导致代码无法运行。这个错误表示你尝试访问一个未定义的变量或函数。确保所有变量在使用前都已经被正确定义。类比 ...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
系统已结题 9月5日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 8月28日

悬赏问题

¥15 c++ gmssl sm2验签demo
¥15 关于模的完全剩余系(关键词-数学方法)
¥15 有没有人懂这个博图程序怎么写，还要跟SFB连接，真的不会，求帮助
¥30 模拟电路 logisim
¥15 PVE8.2.7无法成功使用a5000的vGPU，什么原因
¥15 is not in the mmseg::model registry。报错，模型注册表找不到自定义模块。
¥15 安装quartus II18.1时弹出此error，怎么解决？
¥15 keil官网下载psn序列号在哪
¥15 想用adb命令做一个通话软件，播放录音
¥30 Pytorch深度学习服务器跑不通问题解决？

python代码，请问为什么出现下面的报错？应该如何解决？

0条回答 默认 最新

问题事件

悬赏问题

0条回答默认最新