WIDER FACE 数据集：如何将 VOC 格式转换为 TFRecord 格式


from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import hashlib
import io
import logging
import os

from lxml import etree
import PIL.Image
import tensorflow as tf

from object_detection.utils import dataset_util
from object_detection.utils import label_map_util

# Command-line flags controlling which dataset split is converted and where
# the resulting TFRecord file is written.
flags = tf.flags
flags.DEFINE_string('data_dir', '', 'Root directory to raw PASCAL VOC dataset.')
flags.DEFINE_string('set', 'train', 'Convert training set, validation set or '
                                    'merged set.')
flags.DEFINE_string('annotations_dir', 'Annotations',
                    '(Relative) path to annotations directory.')
# The default must be a member of YEARS below; the previous default
# ('VOC2007') was rejected by the validation in main() on every default run.
flags.DEFINE_string('year', 'widerface',
                    'Desired dataset: fddb, widerface or merged.')
flags.DEFINE_string('output_path', '', 'Path to output TFRecord')
# NOTE(review): the default label map is the PASCAL one; for a face dataset a
# label map containing the annotated class names (e.g. 'face') presumably has
# to be supplied via --label_map_path -- confirm against the dataset.
flags.DEFINE_string('label_map_path', 'data/pascal_label_map.pbtxt',
                    'Path to label map proto')
flags.DEFINE_boolean('ignore_difficult_instances', False, 'Whether to ignore '
                                                          'difficult instances')
FLAGS = flags.FLAGS

# Accepted values for --set.
SETS = ['train', 'val', 'trainval', 'test']
# Accepted values for --year. 'merged' selects every concrete dataset and is
# listed here so that the merged branch in main() is actually reachable.
YEARS = ['fddb', 'widerface', 'merged']


def dict_to_tf_example(data,
                       dataset_directory,
                       label_map_dict,
                       ignore_difficult_instances=False,
                       image_subdirectory='JPEGImages'):
    """Convert an XML-derived annotation dict to a tf.Example proto.

    Bounding box coordinates are normalized by the image width and height
    taken from ``data['size']``.

    Args:
      data: dict holding PASCAL XML fields for a single image (obtained by
        running dataset_util.recursive_parse_xml_to_dict). The keys 'folder',
        'filename' and 'size' are read; 'object' is optional.
      dataset_directory: Path to root directory holding the dataset.
      label_map_dict: A map from string label names to integer ids.
      ignore_difficult_instances: Whether to skip objects flagged as
        difficult (default: False).
      image_subdirectory: String specifying the subdirectory (below
        ``data['folder']``) holding the actual image data.

    Returns:
      example: The converted tf.Example.

    Raises:
      ValueError: if the image pointed to by data['filename'] is not a JPEG.
      KeyError: if an object's name is not present in label_map_dict.
    """
    img_path = os.path.join(data['folder'], image_subdirectory, data['filename'])
    full_path = os.path.join(dataset_directory, img_path)
    with tf.gfile.GFile(full_path, 'rb') as fid:
        encoded_jpg = fid.read()
    # Decode only far enough to verify the container format; the raw bytes
    # are what gets stored in the example.
    image = PIL.Image.open(io.BytesIO(encoded_jpg))
    if image.format != 'JPEG':
        raise ValueError('Image format not JPEG')
    key = hashlib.sha256(encoded_jpg).hexdigest()

    width = int(data['size']['width'])
    height = int(data['size']['height'])

    xmin = []
    ymin = []
    xmax = []
    ymax = []
    classes = []
    classes_text = []
    truncated = []
    poses = []
    difficult_obj = []
    # Images without any annotated object simply yield empty feature lists.
    for obj in data.get('object', []):
        # 'difficult', 'truncated' and 'pose' are treated as optional so that
        # annotations lacking these tags still convert; the fallbacks are
        # "not difficult", "not truncated" and 'Unspecified'.
        difficult = bool(int(obj.get('difficult', 0)))
        if ignore_difficult_instances and difficult:
            continue

        name = obj['name']
        if name not in label_map_dict:
            # Fail with an actionable message instead of a bare KeyError.
            raise KeyError(
                'Object label {!r} in {!r} is not defined in the label map '
                '(known labels: {}). Check that the label map file matches '
                'the dataset.'.format(name, data['filename'],
                                      sorted(label_map_dict)))

        box = obj['bndbox']
        difficult_obj.append(int(difficult))
        xmin.append(float(box['xmin']) / width)
        ymin.append(float(box['ymin']) / height)
        xmax.append(float(box['xmax']) / width)
        ymax.append(float(box['ymax']) / height)
        classes_text.append(name.encode('utf8'))
        classes.append(label_map_dict[name])
        truncated.append(int(obj.get('truncated', 0)))
        poses.append(obj.get('pose', 'Unspecified').encode('utf8'))

    filename_bytes = data['filename'].encode('utf8')
    example = tf.train.Example(features=tf.train.Features(feature={
        'image/height': dataset_util.int64_feature(height),
        'image/width': dataset_util.int64_feature(width),
        'image/filename': dataset_util.bytes_feature(filename_bytes),
        'image/source_id': dataset_util.bytes_feature(filename_bytes),
        'image/key/sha256': dataset_util.bytes_feature(key.encode('utf8')),
        'image/encoded': dataset_util.bytes_feature(encoded_jpg),
        'image/format': dataset_util.bytes_feature('jpeg'.encode('utf8')),
        'image/object/bbox/xmin': dataset_util.float_list_feature(xmin),
        'image/object/bbox/xmax': dataset_util.float_list_feature(xmax),
        'image/object/bbox/ymin': dataset_util.float_list_feature(ymin),
        'image/object/bbox/ymax': dataset_util.float_list_feature(ymax),
        'image/object/class/text': dataset_util.bytes_list_feature(classes_text),
        'image/object/class/label': dataset_util.int64_list_feature(classes),
        'image/object/difficult': dataset_util.int64_list_feature(difficult_obj),
        'image/object/truncated': dataset_util.int64_list_feature(truncated),
        'image/object/view': dataset_util.bytes_list_feature(poses),
    }))
    return example


def main(_):
    """Convert the selected dataset split(s) into a single TFRecord file.

    Reads the example list for FLAGS.set of every selected dataset, parses
    each example's XML annotation, converts it with dict_to_tf_example and
    writes the serialized example to FLAGS.output_path.

    Raises:
      ValueError: if FLAGS.set is not in SETS or FLAGS.year is not in YEARS.
    """
    if FLAGS.set not in SETS:
        raise ValueError('set must be in : {}'.format(SETS))
    if FLAGS.year not in YEARS:
        raise ValueError('year must be in : {}'.format(YEARS))

    data_dir = FLAGS.data_dir
    if FLAGS.year == 'merged':
        # 'merged' means every concrete dataset known to this script.
        # NOTE(review): this branch is only reachable when YEARS itself
        # lists 'merged' -- confirm against the module-level constant.
        years = [year for year in YEARS if year != 'merged']
    else:
        years = [FLAGS.year]

    # Load the label map before opening the writer so that a bad label map
    # path does not leave an empty output file behind.
    label_map_dict = label_map_util.get_label_map_dict(FLAGS.label_map_path)

    writer = tf.python_io.TFRecordWriter(FLAGS.output_path)
    try:
        for year in years:
            logging.info('Reading from PASCAL %s dataset.', year)
            examples_path = os.path.join(data_dir, year, 'ImageSets', 'Main',
                                         FLAGS.set + '.txt')
            annotations_dir = os.path.join(data_dir, year,
                                           FLAGS.annotations_dir)
            examples_list = dataset_util.read_examples_list(examples_path)
            for idx, example in enumerate(examples_list):
                if idx % 100 == 0:
                    logging.info('On image %d of %d', idx, len(examples_list))
                path = os.path.join(annotations_dir, example + '.xml')
                with tf.gfile.GFile(path, 'r') as fid:
                    xml_str = fid.read()
                xml = etree.fromstring(xml_str)
                data = dataset_util.recursive_parse_xml_to_dict(xml)['annotation']

                tf_example = dict_to_tf_example(
                    data, data_dir, label_map_dict,
                    FLAGS.ignore_difficult_instances)
                writer.write(tf_example.SerializeToString())
    finally:
        # Always release the writer, even when an example fails to convert.
        writer.close()


if __name__ == '__main__':
    tf.app.run()

现在运行上面的脚本时报错，完整的错误信息如下：

Traceback (most recent call last):
  File "object_detection/dataset_tools/create_pascal_tf_record.py", line 179, in <module>
    tf.app.run()
  File "C:\Anaconda3\envs\tensorflow1\lib\site-packages\tensorflow\python\platform\app.py", line 125, in run
    _sys.exit(main(argv))
  File "object_detection/dataset_tools/create_pascal_tf_record.py", line 172, in main
    FLAGS.ignore_difficult_instances)
  File "object_detection/dataset_tools/create_pascal_tf_record.py", line 114, in dict_to_tf_example
    classes.append(label_map_dict[obj['name']])
KeyError: 'face'

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

1条回答默认最新

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
像我这样奇怪的人 2021-04-13 11:08
关注
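标签映射文件用错了：脚本默认读取的是 pascal_label_map.pbtxt，其中没有 face 这个类别，所以执行 label_map_dict[obj['name']] 时会抛出 KeyError: 'face'。应该通过 --label_map_path 参数指定包含 face 类别的标签映射文件，例如 face_label_map.pbtxt。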

解决无用
评论打赏
分享
举报

评论

按下Enter换行，Ctrl+Enter发表内容

报告相同问题？

关注问题

coco数据集和voc数据集 目标检测
2022-10-08 15:16

回答 1 已采纳格式没有影响，关键是精度有影响，你看下你转成coco的时候有没有对原来的浮点数进行取整操作
求VOC-360的数据集，谁下载过吗深度学习目标检测计算机视觉
2022-03-02 20:42

回答 1 已采纳下载2007年的训练数据wget http://host.robots.ox.ac.uk/pascal/VOC/voc2007/VOCtrainval_06-Nov-2007.tar 下载2007年的
航拍红外车辆数据集？天津大学？人工智能机器学习目标检测
2022-10-17 17:02

回答 2 已采纳问题1：需要修改成标注的voc数据格式才可以正常使用问题2：不了解
将WIDER FACE数据集转为VOC格式
2022-03-21 15:53

装满水杯的水的博客第一步：在Wider Face官网下载数据集，官网：Wider Face 下载下列四个压缩包第二步：下载完成后进行解压，解压完成之后新建三个文件夹，如下图所示在ImageSets文件夹下新建一个名为Main的文件夹，第...
训练retinanet时用自己的数据集 pytorch 人工智能神经网络
2021-07-12 10:10

回答 1 已采纳占位符问题，你这个前面只有一个占位符，后面却有两个变量，要有两个占位符吧,类似: 'VOCdevkit/VOC2012/ImageSets/Main/%s_%s.txt'%(year, image_s
Tensorflow object detection API 使用VOC数据集出现错误。 tensorflow 深度学习
2019-02-24 18:53

回答 1 已采纳假定程序本身是对的，那么你需要检查你的输入的数据是否正确，还有你的tensorflow的版本和你的程序作者用的版本是否兼容。 tf有很多版本彼此兼容性都不好，所以你要找和作者一致或者接近的版本跑你的
有没有包含xml文件的人脸识别数据集能够下载呢？ python 深度学习目标检测
2022-04-24 22:43

回答 1 已采纳我倒是有一个很基础的，都是xml文件，你要不？要的话发一下邮箱，我给你发过去
数据集VOC正版灭火器数据集VOC格式-5156张
2022-11-08 16:55

数据集格式：Pascal VOC格式(仅仅包含jpg图片和对应的xml) 图片数量(jpg文件个数)：5156 标注数量(xml文件个数)：5156 标注类别数：1 标注类别名称:["fe"] 每个类别标注的框数： fe count = 7762 使用标注工具：...
在yolov3下训练自己的数据集卡住 ubuntu 深度学习目标检测
2022-08-12 21:21

回答 2 已采纳看darknet的git，解决方案是将cuda升级到11.1，cudnn也升级，才能解决这个卡住的问题，和显卡有点关系
yolo数据集制作疑问 python 计算机视觉
2022-04-25 16:11

回答 1 已采纳 1.本质上差别不大，只不过标签格式不同，而两者数据集的标签也可以互相转化。2.因为只有格式上的区别，训练出的模型准确率差别很小，所以不必计较这个望采纳！谢谢
VOC2012用自己数据集转化为record数据时，成功但是0kb，请问知道是什么原因？？ tensorflow 机器学习深度学习
2020-04-17 15:01

回答 2 已采纳请参考：https://blog.csdn.net/ReversalC/article/details/93627310
目标检测之摔倒检测数据集，voc格式
2023-05-09 15:39

这个是从网上整理的资源，用于目标检测的摔倒检测数据集，格式是voc数据格式。由于是网上整理的数据集，用于学习和研究。
YOLOv5(PyTorch)实战：训练自己的数据集课程中遇到的问题 pytorch
2022-04-05 21:57

回答 1 已采纳 in "models/yolov5s_ball.yaml", line 5, column 1检查以下这个文件，这里出现的错误
道路裂缝数据集VOC格式-12988张
2022-06-29 10:06

数据集格式：Pascal VOC格式(不包含分割的txt文件，仅仅包含jpg图片和对应的xml) 图片数量(jpg文件个数)：12988 标注数量(xml文件个数)：12988 标注类别数：1 标注类别名称:["roadcrack"] 每个类别标注的框数： ...
widerface数据集转换为VOC程序.zip_TFRecord_Voc format_feweru64_wider_face
2022-09-22 14:33

将widerface的图片数据集转化为VOC格式的数据集，为了后期转化为TFrecord格式
没有解决我的问题, 去提问

悬赏问题

¥20 sub地址DHCP问题
¥15 delta降尺度计算的一些细节，有偿
¥15 Arduino红外遥控代码有问题
¥15 数值计算离散正交多项式
¥30 数值计算均差系数编程
¥15 redis-full-check比较两个集群的数据出错
¥15 Matlab编程问题
¥15 训练的多模态特征融合模型准确度很低怎么办
¥15 kylin启动报错log4j类冲突
¥15 超声波模块测距控制点灯，灯的闪烁很不稳定，经过调试发现测的距离偏大

widerface数据集voc格式转换tfrecord格式

1条回答 默认 最新

悬赏问题

1条回答默认最新