# Convert WIDER FACE annotations to YOLO (darknet) and Pascal VOC formats.
import os, h5py, cv2, sys, shutil
import numpy as np
from xml.dom.minidom import Document

rootdir = "G:/MTCNNTraining/faceData/widerFace"
convet2yoloformat = True
convert2vocformat = True
resized_dim = (48, 48)  # keep faces down to minsize2select pixels, and pad images to square
minsize2select = 1
usepadding = True
datasetprefix = "G:/MTCNNTraining/faceData/widerFace"


def gen_hdf5():
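    """Crop every labelled face from the WIDER train split, resize each crop
    to resized_dim and dump the crops and labels into train.h5 (HDF5)."""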
    imgdir = rootdir + "/WIDER_train/images"
    gtfilepath = rootdir + "/wider_face_split/wider_face_train_bbx_gt.txt"
    index = 0
    with open(gtfilepath, 'r') as gtfile:
        faces = []
        labels = []
        while True:  # and len(faces)<10
            imgpath = gtfile.readline()[:-1]
            if imgpath == "":
                break
            print(index, imgpath)
            img = cv2.imread(imgdir + "/" + imgpath)
            numbbox = int(gtfile.readline())
            bbox = []
            for i in range(numbbox):
                line = gtfile.readline()
                line = line.split()
                line = line[0:4]
                if int(line[3]) <= 0 or int(line[2]) <= 0:
                    continue
                bbox = (int(line[0]), int(line[1]), int(line[2]), int(line[3]))
                face = img[int(line[1]):int(line[1]) + int(line[3]), int(line[0]):int(line[0]) + int(line[2])]
                face = cv2.resize(face, resized_dim)
                faces.append(face)
                labels.append(1)
                cv2.rectangle(img, (int(line[0]), int(line[1])),
                              (int(line[0]) + int(line[2]), int(line[1]) + int(line[3])), (255, 0, 0))
            # cv2.imshow("img", img)
            # cv2.waitKey(1)
            index = index + 1
    faces = np.asarray(faces)
    labels = np.asarray(labels)
    f = h5py.File('train.h5', 'w')
    f['data'] = faces.astype(np.float32)
    f['label'] = labels.astype(np.float32)
    f.close()


def viewginhdf5():
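    """Read the face crops back from train.h5 and display them one by one."""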
    f = h5py.File('train.h5', 'r')
    f.keys()
    faces = f['data'][:]
    for face in faces:
        face = face.astype(np.uint8)
        cv2.imshow("img", face)
        cv2.waitKey(1)
    f.close()


def convertimgset(img_set="train"):
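    """Pad every image of the given split to a square canvas, copy it to
    rootdir/images, and write the face boxes as YOLO .txt labels and/or
    Pascal VOC .xml annotations, depending on the flags at the top."""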
imgdir = rootdir + "/WIDER_" + img_set + "/images"
gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
imagesdir = rootdir + "/images"
vocannotationdir = rootdir + "/Annotations"
labelsdir = rootdir + "/labels"
if not os.path.exists(imagesdir):
os.mkdir(imagesdir)
if convet2yoloformat:
if not os.path.exists(labelsdir):
os.mkdir(labelsdir)
if convert2vocformat:
if not os.path.exists(vocannotationdir):
os.mkdir(vocannotationdir)
index = 0
    with open(gtfilepath, 'r') as gtfile:
        while True:  # and len(faces)<10
            filename = gtfile.readline()[:-1]
            if filename == "":
                break
            sys.stdout.write("\r" + str(index) + ":" + filename + "\t\t\t")
            sys.stdout.flush()
            imgpath = imgdir + "/" + filename
            img = cv2.imread(imgpath)
            if img is None:  # cv2.imread returns None when the file cannot be read
                break
            imgheight = img.shape[0]
            imgwidth = img.shape[1]
            maxl = max(imgheight, imgwidth)
            paddingleft = (maxl - imgwidth) >> 1
            paddingright = (maxl - imgwidth) >> 1
            paddingbottom = (maxl - imgheight) >> 1
            paddingtop = (maxl - imgheight) >> 1
            saveimg = cv2.copyMakeBorder(img, paddingtop, paddingbottom, paddingleft, paddingright,
                                         cv2.BORDER_CONSTANT, value=0)
            showimg = saveimg.copy()
            numbbox = int(gtfile.readline())
            bboxes = []
            for i in range(numbbox):
                line = gtfile.readline()
                line = line.split()
                line = line[0:4]
                if int(line[3]) <= 0 or int(line[2]) <= 0:
                    continue
                x = int(line[0]) + paddingleft
                y = int(line[1]) + paddingtop
                width = int(line[2])
                height = int(line[3])
                bbox = (x, y, width, height)
                x2 = x + width
                y2 = y + height
                # face = img[x:x2, y:y2]
                if width >= minsize2select and height >= minsize2select:
                    bboxes.append(bbox)
                    cv2.rectangle(showimg, (x, y), (x2, y2), (0, 255, 0))
                    # maxl = max(width, height)
                    # x3 = (int)(x + (width - maxl) * 0.5)
                    # y3 = (int)(y + (height - maxl) * 0.5)
                    # x4 = (int)(x3 + maxl)
                    # y4 = (int)(y3 + maxl)
                    # cv2.rectangle(img, (x3, y3), (x4, y4), (255, 0, 0))
                else:
                    cv2.rectangle(showimg, (x, y), (x2, y2), (0, 0, 255))
            filename = filename.replace("/", "_")
            if len(bboxes) == 0:
                print("warning: no face")
                continue
            cv2.imwrite(imagesdir + "/" + filename, saveimg)
            if convet2yoloformat:
                height = saveimg.shape[0]
                width = saveimg.shape[1]
                txtpath = labelsdir + "/" + filename
                txtpath = txtpath[:-3] + "txt"
                ftxt = open(txtpath, 'w')
                for i in range(len(bboxes)):
                    bbox = bboxes[i]
                    xcenter = (bbox[0] + bbox[2] * 0.5) / width
                    ycenter = (bbox[1] + bbox[3] * 0.5) / height
                    wr = bbox[2] * 1.0 / width
                    hr = bbox[3] * 1.0 / height
                    txtline = "0 " + str(xcenter) + " " + str(ycenter) + " " + str(wr) + " " + str(hr) + "\n"
                    ftxt.write(txtline)
                ftxt.close()
            if convert2vocformat:
                xmlpath = vocannotationdir + "/" + filename
                xmlpath = xmlpath[:-3] + "xml"
                doc = Document()
                annotation = doc.createElement('annotation')
                doc.appendChild(annotation)
                folder = doc.createElement('folder')
                folder_name = doc.createTextNode('widerface')
                folder.appendChild(folder_name)
                annotation.appendChild(folder)
                filenamenode = doc.createElement('filename')
                filename_name = doc.createTextNode(filename)
                filenamenode.appendChild(filename_name)
                annotation.appendChild(filenamenode)
                source = doc.createElement('source')
                annotation.appendChild(source)
                database = doc.createElement('database')
                database.appendChild(doc.createTextNode('wider face Database'))
                source.appendChild(database)
                annotation_s = doc.createElement('annotation')
                annotation_s.appendChild(doc.createTextNode('PASCAL VOC2007'))
                source.appendChild(annotation_s)
                image = doc.createElement('image')
                image.appendChild(doc.createTextNode('flickr'))
                source.appendChild(image)
                flickrid = doc.createElement('flickrid')
                flickrid.appendChild(doc.createTextNode('-1'))
                source.appendChild(flickrid)
                owner = doc.createElement('owner')
                annotation.appendChild(owner)
                flickrid_o = doc.createElement('flickrid')
                flickrid_o.appendChild(doc.createTextNode('widerFace'))
                owner.appendChild(flickrid_o)
                name_o = doc.createElement('name')
                name_o.appendChild(doc.createTextNode('widerFace'))
                owner.appendChild(name_o)
                size = doc.createElement('size')
                annotation.appendChild(size)
                width = doc.createElement('width')
                width.appendChild(doc.createTextNode(str(saveimg.shape[1])))
                height = doc.createElement('height')
                height.appendChild(doc.createTextNode(str(saveimg.shape[0])))
                depth = doc.createElement('depth')
                depth.appendChild(doc.createTextNode(str(saveimg.shape[2])))
                size.appendChild(width)
                size.appendChild(height)
                size.appendChild(depth)
                segmented = doc.createElement('segmented')
                segmented.appendChild(doc.createTextNode(''))
                annotation.appendChild(segmented)
                for i in range(len(bboxes)):
                    bbox = bboxes[i]
                    objects = doc.createElement('object')
                    annotation.appendChild(objects)
                    object_name = doc.createElement('name')
                    object_name.appendChild(doc.createTextNode('face'))
                    objects.appendChild(object_name)
                    pose = doc.createElement('pose')
                    pose.appendChild(doc.createTextNode('Unspecified'))
                    objects.appendChild(pose)
                    truncated = doc.createElement('truncated')
                    truncated.appendChild(doc.createTextNode(''))
                    objects.appendChild(truncated)
                    difficult = doc.createElement('difficult')
                    difficult.appendChild(doc.createTextNode(''))
                    objects.appendChild(difficult)
                    bndbox = doc.createElement('bndbox')
                    objects.appendChild(bndbox)
                    xmin = doc.createElement('xmin')
                    xmin.appendChild(doc.createTextNode(str(bbox[0])))
                    bndbox.appendChild(xmin)
                    ymin = doc.createElement('ymin')
                    ymin.appendChild(doc.createTextNode(str(bbox[1])))
                    bndbox.appendChild(ymin)
                    xmax = doc.createElement('xmax')
                    xmax.appendChild(doc.createTextNode(str(bbox[0] + bbox[2])))
                    bndbox.appendChild(xmax)
                    ymax = doc.createElement('ymax')
                    ymax.appendChild(doc.createTextNode(str(bbox[1] + bbox[3])))
                    bndbox.appendChild(ymax)
                f = open(xmlpath, "w")
                f.write(doc.toprettyxml(indent=''))
                f.close()
            # cv2.imshow("img", showimg)
            # cv2.waitKey()
            index = index + 1


def generatetxt(img_set="train"):
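    """Write rootdir/<img_set>.txt with one converted-image path per line,
    the list file consumed by YOLO/darknet training."""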
    gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
    f = open(rootdir + "/" + img_set + ".txt", "w")
    with open(gtfilepath, 'r') as gtfile:
        while True:  # and len(faces)<10
            filename = gtfile.readline()[:-1]
            if filename == "":
                break
            filename = filename.replace("/", "_")
            imgfilepath = datasetprefix + "/images/" + filename
            f.write(imgfilepath + '\n')
            numbbox = int(gtfile.readline())
            for i in range(numbbox):
                line = gtfile.readline()
    f.close()


def generatevocsets(img_set="train"):
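    """Write ImageSets/Main/<img_set>.txt with one image basename (no
    extension) per line, following the Pascal VOC image-set layout."""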
    if not os.path.exists(rootdir + "/ImageSets"):
        os.mkdir(rootdir + "/ImageSets")
    if not os.path.exists(rootdir + "/ImageSets/Main"):
        os.mkdir(rootdir + "/ImageSets/Main")
    gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
    f = open(rootdir + "/ImageSets/Main/" + img_set + ".txt", 'w')
    with open(gtfilepath, 'r') as gtfile:
        while True:  # and len(faces)<10
            filename = gtfile.readline()[:-1]
            if filename == "":
                break
            filename = filename.replace("/", "_")
            imgfilepath = filename[:-4]
            f.write(imgfilepath + '\n')
            numbbox = int(gtfile.readline())
            for i in range(numbbox):
                line = gtfile.readline()
    f.close()


def convertdataset():
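    """Run image conversion and list-file generation for the train and val splits."""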
    img_sets = ["train", "val"]
    for img_set in img_sets:
        convertimgset(img_set)
        generatetxt(img_set)
        generatevocsets(img_set)


if __name__ == "__main__":
    convertdataset()
    shutil.move(rootdir + "/" + "train.txt", rootdir + "/" + "trainval.txt")
    shutil.move(rootdir + "/" + "val.txt", rootdir + "/" + "test.txt")
    shutil.move(rootdir + "/ImageSets/Main/" + "train.txt", rootdir + "/ImageSets/Main/" + "trainval.txt")
    shutil.move(rootdir + "/ImageSets/Main/" + "val.txt", rootdir + "/ImageSets/Main/" + "test.txt")
