保存标注对象到txt 制作xml

1、算法将检测的目标名称和目标位置保存到txt文本

格式：第一行为图片名，第二行为该图片的目标个数，其后每行为一个目标：目标名 xmin ymin xmax ymax

(4).avi237face.jpg
4
smoke 83 234 142 251
hand 119 255 271 306
eye 178 148 216 163
eye 111 156 148 173

#!/usr/bin/python

# -*- coding: UTF-8 -*-

import os, h5py, cv2, sys, shutil

import numpy as np

from xml.dom.minidom import Document

# Dataset root; convertimgset derives every input and output path from it.
rootdir = "G:/MTCNNTraining/faceData/train"

# When true, the "labels" output directory is created. No YOLO label files
# are currently written by convertimgset.
convet2yoloformat = True

# When true, one PASCAL-VOC style XML file per image is written under
# "Annotations".
convert2vocformat = True

# NOTE(review): not referenced anywhere in the visible code.
resized_dim = (48, 48)

# Minimum box width and height (in pixels) for an object to be kept.
# NOTE(review): the original comment said "select faces of at least size 20,
# and pad", but the value below is 1 -- confirm which is intended.

minsize2select = 1

# NOTE(review): not referenced in the visible code; convertimgset always pads.
usepadding = True

def _add_text_element(doc, parent, tag, text):
    """Append ``<tag>text</tag>`` to *parent* and return the new element."""
    element = doc.createElement(tag)
    element.appendChild(doc.createTextNode(text))
    parent.appendChild(element)
    return element


def _read_annotation_record(gtfile):
    """Read one image record from the ground-truth file.

    A record is a file-name line, a line holding the number of objects, and
    then one ``label xmin ymin xmax ymax`` line per object.

    Returns:
        ``(filename, rows)`` where ``rows`` is a list of
        ``(label, [xmin, ymin, xmax, ymax])``, or ``None`` when an empty
        line or end-of-file is reached.

    Raises:
        ValueError: if the count or a coordinate is not an integer, or an
            object line has fewer than five fields.
    """
    # rstrip instead of [:-1]: a final line without a trailing newline must
    # not lose its last character.
    filename = gtfile.readline().rstrip("\r\n")
    if filename == "":
        return None
    count = int(gtfile.readline())
    rows = []
    for _ in range(count):
        fields = gtfile.readline().split()
        if len(fields) < 5:
            raise ValueError("malformed annotation line for " + filename)
        rows.append((fields[0], [int(value) for value in fields[1:5]]))
    return filename, rows


def _build_voc_document(filename, shape, bboxes, bnames):
    """Build the PASCAL-VOC style XML document for one image.

    Args:
        filename: image file name stored in the ``filename`` element.
        shape: ``(height, width, channels)`` of the saved image.
        bboxes: list of ``(xmin, ymin, xmax, ymax)`` tuples.
        bnames: object labels, parallel to ``bboxes``.

    Returns:
        The populated ``xml.dom.minidom.Document``.
    """
    doc = Document()
    annotation = doc.createElement('annotation')
    doc.appendChild(annotation)

    _add_text_element(doc, annotation, 'folder', 'widerface')
    _add_text_element(doc, annotation, 'filename', filename)

    source = doc.createElement('source')
    annotation.appendChild(source)
    _add_text_element(doc, source, 'database', 'wider face Database')
    _add_text_element(doc, source, 'annotation', 'PASCAL VOC2007')
    _add_text_element(doc, source, 'image', 'flickr')
    _add_text_element(doc, source, 'flickrid', '-1')

    owner = doc.createElement('owner')
    annotation.appendChild(owner)
    _add_text_element(doc, owner, 'flickrid', 'widerFace')
    _add_text_element(doc, owner, 'name', 'widerFace')

    size = doc.createElement('size')
    annotation.appendChild(size)
    _add_text_element(doc, size, 'width', str(shape[1]))
    _add_text_element(doc, size, 'height', str(shape[0]))
    _add_text_element(doc, size, 'depth', str(shape[2]))

    _add_text_element(doc, annotation, 'segmented', '')

    for label, (xmin, ymin, xmax, ymax) in zip(bnames, bboxes):
        obj = doc.createElement('object')
        annotation.appendChild(obj)
        _add_text_element(doc, obj, 'name', str(label))
        _add_text_element(doc, obj, 'pose', 'Unspecified')
        _add_text_element(doc, obj, 'truncated', '')
        _add_text_element(doc, obj, 'difficult', '')
        bndbox = doc.createElement('bndbox')
        obj.appendChild(bndbox)
        _add_text_element(doc, bndbox, 'xmin', str(xmin))
        _add_text_element(doc, bndbox, 'ymin', str(ymin))
        _add_text_element(doc, bndbox, 'xmax', str(xmax))
        _add_text_element(doc, bndbox, 'ymax', str(ymax))
    return doc


def convertimgset(img_set="train"):
    """Pad annotated images to a square and write VOC XML annotations.

    Reads ``rootdir/SSDSave.txt``, loads each listed image from
    ``rootdir/trainImages``, pads it with black borders to a square, saves
    it under ``rootdir/images`` and, when ``convert2vocformat`` is true,
    writes a matching XML file under ``rootdir/Annotations``. Images that
    end up with no usable box are not saved.

    Args:
        img_set: not used by the body; kept so existing callers that pass
            it keep working.

    Raises:
        ValueError: if the ground-truth file is malformed.
    """
    imgdir = rootdir + "/trainImages"
    gtfilepath = rootdir + "/SSDSave.txt"
    imagesdir = rootdir + "/images"
    vocannotationdir = rootdir + "/Annotations"
    labelsdir = rootdir + "/labels"

    # The labels directory is still created for the YOLO flag, although no
    # YOLO label files are written by this function.
    outdirs = [imagesdir]
    if convet2yoloformat:
        outdirs.append(labelsdir)
    if convert2vocformat:
        outdirs.append(vocannotationdir)
    for outdir in outdirs:
        if not os.path.exists(outdir):
            os.mkdir(outdir)

    index = 0
    with open(gtfilepath, 'r') as gtfile:
        while True:
            # The whole record is consumed before the image is loaded, so a
            # skipped image cannot leave the parser out of sync.
            record = _read_annotation_record(gtfile)
            if record is None:
                break
            filename, rows = record

            sys.stdout.write("\r" + str(index) + ":" + filename + "\t\t\t")
            sys.stdout.flush()

            imgpath = imgdir + "/" + filename
            img = cv2.imread(imgpath)
            # cv2.imread signals failure by returning None, not by raising.
            if img is None:
                print("warning: cannot read image " + imgpath)
                continue

            imgheight = img.shape[0]
            imgwidth = img.shape[1]
            maxl = max(imgheight, imgwidth)
            # The far side takes the remainder so that an odd difference
            # still yields an exactly square canvas.
            paddingleft = (maxl - imgwidth) >> 1
            paddingright = (maxl - imgwidth) - paddingleft
            paddingtop = (maxl - imgheight) >> 1
            paddingbottom = (maxl - imgheight) - paddingtop
            saveimg = cv2.copyMakeBorder(img, paddingtop, paddingbottom,
                                         paddingleft, paddingright,
                                         cv2.BORDER_CONSTANT, value=0)

            bboxes = []
            bnames = []
            for obj_name, (xmin, ymin, xmax, ymax) in rows:
                if ymax <= 0 or xmax <= 0:
                    continue
                width = xmax - xmin + 1
                height = ymax - ymin + 1
                if width >= minsize2select and height >= minsize2select:
                    # Corners are shifted by the padding only; the source
                    # corners are inclusive, so no extra pixel is added to
                    # xmax/ymax.
                    bboxes.append((xmin + paddingleft, ymin + paddingtop,
                                   xmax + paddingleft, ymax + paddingtop))
                    bnames.append(obj_name)

            if len(bboxes) == 0:
                print ("warrning: no face")
                continue

            cv2.imwrite(imagesdir + "/" + filename, saveimg)

            if convert2vocformat:
                # splitext handles extensions of any length (e.g. ".jpeg").
                xmlpath = (vocannotationdir + "/"
                           + os.path.splitext(filename)[0] + ".xml")
                doc = _build_voc_document(filename, saveimg.shape,
                                          bboxes, bnames)
                with open(xmlpath, "w") as f:
                    f.write(doc.toprettyxml(indent=''))

            index = index + 1

def convertdataset():
    """Run convertimgset once for each configured image set."""
    for subset_name in ("train",):
        convertimgset(subset_name)

# Run the conversion only when this file is executed as a script.
if __name__ == "__main__":

    convertdataset()

保存标注对象到txt 制作xml的更多相关文章

OpenCV训练分类器制作xml文档
OpenCV训练分类器制作xml文档 (2011-08-25 15:50:06) 转载▼ 标签: 杂谈分类: 学习我的问题:有了opencv自带的那些xml人脸检测文档,我们就可以用cvLoad( ...
Adobe AIR and Flex - 保存序列化对象文件（译）
创建任何桌面应用程序几乎总是需要在本地存储数据,通过Adobe AIR我们有几下面几个选择,一个是我们能够使用内置的 SQLite 数据库支持,对于少量的数据这是大材小用了.另外一个选择是我们通过把数 ...
Java 将Word转为PDF、PNG、SVG、RTF、XPS、TXT、XML
同一文档在不同的编译或阅读环境中,需要使用特定的文档格式来打开,通常需要通过转换文档格式的方式来实现.下面将介绍在Java程序中如何来转换Word文档为其他几种常见文档格式,如PDF.图片png.sv ...
网站robots.txt & sitemap.xml
1. 如何查看网站的robots.txt 网址/robots.txt, 比如小米 https://www.mi.com/robots.txt sitemap.xml
NSUserDefault 保存自定义对象
由于NSUserDefaults 不支持保存自定类,保存的对象需要实现NSCoding协议,不过自定的类型就算实现了NSCoding也不可以保存,可以通过以下方法实现: //h文件 #import & ...
solr6.6 导入文本（txt/json/xml/csv）文件
参照:solr6.6 导入 pdf文件重点就是三个配置文件 1.建立的data-config.xml 内容如下: <dataConfig> <dataSource name=&qu ...
Tomcat关闭后,重新启动,session中保存的对象为什么还存在解决方法
Tomcat关闭后,重新启动,session中保存的对象为什么还存在各们朋友大家好: 当我关闭Tomcat,重新启动后,session中保存的对象还依然存在,仍然可以使用,不知这是什么 ...
在MySQL中保存Java对象
需要在MySQL中保存Java对象. 说明: 对象必须实现序列化 MySQL中对应字段设置为blob 将Java对象序列化为byte[] public static byte[] obj2byte(O ...
Map集合的遍历方式以及TreeMap集合保存自定义对象实现比较的Comparable和Comparator两种方式
Map集合的特点 1.Map集合中保存的都是键值对,键和值是一一对应的 2.一个映射不能包含重复的值 3.每个键最多只能映射到一个值上 Map接口和Collection接口的不同 Map是双列集合的根 ...

随机推荐

vue评论显示隐藏，JavaScript显示关闭
<template> <div id="vue_det"> <h1>{{details()}}</h1> <div>{{ ...
Error:java: Annotation processing is not supported for module cycles. Please ensure that all modules from cycle [web_dao,web_service] are excluded from annotation processing
早上学习maven环境搭建时遇到的这个问题下面这个错误的大概意思是:模块之间的互相依赖 Error:java: Annotation processing is not supported for ...
com.mysql.cj.core.exceptions.InvalidConnectionAttributeException: The server time zone value '�й�� mysql-installer-community-8.0.15.0
<properties> <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding> &l ...
[CentOS] rsync同步目录进行备份文件
操作不难,网上一堆.这里列几个 CentOS7 参考地址: https://www.server-world.info/en/note?os=CentOS_7&p=rsync Copy fil ...
Mysql千万级大数据量查询优化
来源于:https://blog.csdn.net/A350204530/article/details/79040277 1.对查询进行优化,应尽量避免全表扫描,首先应考虑在 where 及 ord ...
Flask实战-留言板-使用Flask-DebugToolbar调试程序、Flask配置的两种组织形式
使用Flask-DebugToolbar调试程序扩展Flask-DebugToolbar提供了一系列调试功能,可以用来查看请求的SQL语句.配置选项.资源加载情况等信息.这些信息在开发时会非常有用. ...
Python爬虫与一汽项目【一】爬取中海油，邮政，国家电网问题总结
项目介绍中国海洋石油是爬取的第一个企业,之后依次爬取了,国家电网,中国邮政,这三家公司的源码并没有多大难度, 采购信息地址: 国家电网电子商务平台 http://ecp.sgcc.com.cn/pr ...
MySQL复制表-INSERT INTO SELECT
基础table为: mysql> select * from staff; +----+----------+-------+ | id | name | slary | +----+----- ...
MTK-LCM 屏幕使用fbconfig/PanelMaster来调试LCM驱动
屏幕调试是我们做的较多的工作,且以MIPI屏为主,调试时总是会遇到一些参数需要一点一点配的时候,这样的工作其实很是繁琐,在我们确认完硬件没有问题时能不能使用简易的方法来解决这个问题呢 ? MTK已经为 ...
sdoi2018旧试题证明

保存标注对象到txt 制作xml

保存标注对象到txt 制作xml的更多相关文章

随机推荐

热门专题