widerface---VOC

import os, h5py, cv2, sys, shutil

import numpy as np

from xml.dom.minidom import Document

# Directory holding the WIDER FACE download (WIDER_<set>/images and
# wider_face_split); the converted images/labels/annotations are written here too.
rootdir = "G:/MTCNNTraining/faceData/widerFace"

# When True, convertimgset() writes one YOLO label .txt per image under <rootdir>/labels.
convet2yoloformat = True

# When True, convertimgset() writes one VOC .xml per image under <rootdir>/Annotations.
convert2vocformat = True

# Size passed to cv2.resize for every face crop stored by gen_hdf5().
resized_dim = (48, 48)

# Keep faces whose width and height are at least this many pixels (1 keeps
# every non-empty box), and pad the image.

minsize2select = 1

# NOTE(review): not read anywhere in the visible code -- convertimgset() always
# pads; confirm whether this flag was meant to switch padding off.
usepadding = True

# Prefix written in front of each image name by generatetxt().
datasetprefix = "G:/MTCNNTraining/faceData/widerFace"  #

def gen_hdf5():
    """Crop every annotated training face, resize it and store the set in train.h5.

    Reads ``<rootdir>/wider_face_split/wider_face_train_bbx_gt.txt`` and the
    images under ``<rootdir>/WIDER_train/images``.  Each box with positive
    width and height is cropped, resized to ``resized_dim`` and appended to
    the ``data`` dataset; a matching ``1`` is appended to ``label``.  Both
    datasets are written as float32 to ``train.h5`` in the current directory.

    Images that cannot be read and boxes that fall completely outside the
    image are skipped with no crop stored.
    """
    imgdir = rootdir + "/WIDER_train/images"
    gtfilepath = rootdir + "/wider_face_split/wider_face_train_bbx_gt.txt"

    faces = []
    labels = []
    index = 0

    with open(gtfilepath, 'r') as gtfile:
        pending = None  # a line read ahead that is really the next record's name
        while True:
            header = gtfile.readline() if pending is None else pending
            pending = None
            # strip() instead of [:-1]: the last line may lack a trailing newline.
            imgpath = header.strip()
            if not imgpath:
                break

            print (index, imgpath)
            index = index + 1

            numbbox = int(gtfile.readline())
            rows = [gtfile.readline().split()[0:4] for _ in range(numbbox)]
            if numbbox == 0:
                # Some releases of the ground truth follow a zero count with
                # an all-zero placeholder row; consume it only if it is one.
                peek = gtfile.readline()
                fields = peek.split()
                if not (len(fields) >= 4 and all(tok.isdigit() for tok in fields)):
                    pending = peek

            img = cv2.imread(imgdir + "/" + imgpath)
            if img is None:
                # cv2.imread signals failure by returning None, not by raising.
                print ("warning: cannot read image " + imgpath)
                continue

            for row in rows:
                x, y, w, h = int(row[0]), int(row[1]), int(row[2]), int(row[3])
                if h <= 0 or w <= 0:
                    continue

                # The image is deliberately left unmodified: drawing the box
                # on it would leak rectangle pixels into later, overlapping crops.
                face = img[y:y + h, x:x + w]
                if face.size == 0:
                    # Box lies outside the image; cv2.resize rejects empty input.
                    continue

                faces.append(cv2.resize(face, resized_dim))
                labels.append(1)

    faces = np.asarray(faces)
    labels = np.asarray(labels)

    # The context manager closes the HDF5 file even if a write fails.
    with h5py.File('train.h5', 'w') as f:
        f['data'] = faces.astype(np.float32)
        f['label'] = labels.astype(np.float32)

def viewginhdf5():
    """Show every face stored in ``train.h5`` in an OpenCV window named "img".

    The whole ``data`` dataset is loaded into memory first, so the file is
    closed (even on error) before any window is opened.  Each face is cast
    to uint8 for display and shown for roughly one millisecond.
    """
    with h5py.File('train.h5', 'r') as f:
        faces = f['data'][:]

    for face in faces:
        cv2.imshow("img", face.astype(np.uint8))
        cv2.waitKey(1)

def _iter_wider_annotations(gtfile):
    """Yield ``(filename, rows)`` for each record of a WIDER FACE ground-truth file.

    ``rows`` is a list with one whitespace-split annotation line per box.
    Iteration stops at end of file or at the first blank line.
    """
    pending = None  # a line read ahead that is really the next record's name
    while True:
        header = gtfile.readline() if pending is None else pending
        pending = None
        # strip() instead of [:-1]: the last line may lack a trailing newline.
        filename = header.strip()
        if not filename:
            return

        numbbox = int(gtfile.readline())
        rows = [gtfile.readline().split() for _ in range(numbbox)]
        if numbbox == 0:
            # Some releases of the ground truth follow a zero count with an
            # all-zero placeholder row; consume it only if it really is one,
            # otherwise it is the next file name and must not be lost.
            peek = gtfile.readline()
            fields = peek.split()
            if not (len(fields) >= 4 and all(tok.isdigit() for tok in fields)):
                pending = peek

        yield filename, rows


def _append_text_element(doc, parent, tag, text):
    """Append ``<tag>text</tag>`` to *parent* and return the new element."""
    node = doc.createElement(tag)
    node.appendChild(doc.createTextNode(text))
    parent.appendChild(node)
    return node


def _write_yolo_labels(txtpath, bboxes, imgwidth, imgheight):
    """Write one ``0 xcenter ycenter w h`` line per box, normalised by image size."""
    with open(txtpath, 'w') as ftxt:
        for x, y, w, h in bboxes:
            xcenter = (x + w * 0.5) / imgwidth
            ycenter = (y + h * 0.5) / imgheight
            wr = w * 1.0 / imgwidth
            hr = h * 1.0 / imgheight
            ftxt.write("0 " + str(xcenter) + " " + str(ycenter) + " " + str(wr) + " " + str(hr) + "\n")


def _write_voc_annotation(xmlpath, filename, imgshape, bboxes):
    """Write a PASCAL VOC style XML annotation with one ``face`` object per box."""
    doc = Document()
    annotation = doc.createElement('annotation')
    doc.appendChild(annotation)

    _append_text_element(doc, annotation, 'folder', 'widerface')
    _append_text_element(doc, annotation, 'filename', filename)

    source = doc.createElement('source')
    annotation.appendChild(source)
    _append_text_element(doc, source, 'database', 'wider face Database')
    _append_text_element(doc, source, 'annotation', 'PASCAL VOC2007')
    _append_text_element(doc, source, 'image', 'flickr')
    _append_text_element(doc, source, 'flickrid', '-1')

    owner = doc.createElement('owner')
    annotation.appendChild(owner)
    _append_text_element(doc, owner, 'flickrid', 'widerFace')
    _append_text_element(doc, owner, 'name', 'widerFace')

    size = doc.createElement('size')
    annotation.appendChild(size)
    _append_text_element(doc, size, 'width', str(imgshape[1]))
    _append_text_element(doc, size, 'height', str(imgshape[0]))
    _append_text_element(doc, size, 'depth', str(imgshape[2]))

    # VOC flags are 0/1 integers; an empty element breaks readers that call
    # int() on the text, so write an explicit 0.
    _append_text_element(doc, annotation, 'segmented', '0')

    for x, y, w, h in bboxes:
        obj = doc.createElement('object')
        annotation.appendChild(obj)
        _append_text_element(doc, obj, 'name', 'face')
        _append_text_element(doc, obj, 'pose', 'Unspecified')
        _append_text_element(doc, obj, 'truncated', '0')
        _append_text_element(doc, obj, 'difficult', '0')

        bndbox = doc.createElement('bndbox')
        obj.appendChild(bndbox)
        _append_text_element(doc, bndbox, 'xmin', str(x))
        _append_text_element(doc, bndbox, 'ymin', str(y))
        _append_text_element(doc, bndbox, 'xmax', str(x + w))
        _append_text_element(doc, bndbox, 'ymax', str(y + h))

    with open(xmlpath, "w") as f:
        f.write(doc.toprettyxml(indent=''))


def convertimgset(img_set="train"):
    """Convert one WIDER FACE split into padded images plus YOLO/VOC labels.

    For every record in ``wider_face_<img_set>_bbx_gt.txt`` the image is
    padded with black borders to a square, saved under ``<rootdir>/images``
    (with ``/`` in the name replaced by ``_``), and its boxes are shifted by
    the padding.  Depending on ``convet2yoloformat`` / ``convert2vocformat``
    a YOLO ``.txt`` is written under ``<rootdir>/labels`` and a VOC ``.xml``
    under ``<rootdir>/Annotations``.

    Boxes with non-positive width or height, or smaller than
    ``minsize2select``, are dropped.  Images left with no box, and images
    that cannot be read, are skipped with a warning.

    Args:
        img_set: Split name used to build the input paths, e.g. "train" or "val".
    """
    imgdir = rootdir + "/WIDER_" + img_set + "/images"
    gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
    imagesdir = rootdir + "/images"
    vocannotationdir = rootdir + "/Annotations"
    labelsdir = rootdir + "/labels"

    outdirs = [imagesdir]
    if convet2yoloformat:
        outdirs.append(labelsdir)
    if convert2vocformat:
        outdirs.append(vocannotationdir)
    for outdir in outdirs:
        if not os.path.exists(outdir):
            os.mkdir(outdir)

    index = 0
    with open(gtfilepath, 'r') as gtfile:
        for filename, rows in _iter_wider_annotations(gtfile):
            sys.stdout.write("\r" + str(index) + ":" + filename + "\t\t\t")
            sys.stdout.flush()

            # Filter the raw boxes first so images without a usable face are
            # rejected before the image is decoded.
            rawboxes = []
            for row in rows:
                x, y, width, height = int(row[0]), int(row[1]), int(row[2]), int(row[3])
                if height <= 0 or width <= 0:
                    continue
                if width >= minsize2select and height >= minsize2select:
                    rawboxes.append((x, y, width, height))

            if not rawboxes:
                print ("warrning: no face")
                continue

            img = cv2.imread(imgdir + "/" + filename)
            if img is None:
                # cv2.imread signals failure by returning None, not by raising.
                print ("warning: cannot read image " + filename)
                continue

            imgheight = img.shape[0]
            imgwidth = img.shape[1]
            maxl = max(imgheight, imgwidth)

            # Give the far side whatever the near side did not take, so an
            # odd difference still produces an exactly square image.
            paddingleft = (maxl - imgwidth) // 2
            paddingright = maxl - imgwidth - paddingleft
            paddingtop = (maxl - imgheight) // 2
            paddingbottom = maxl - imgheight - paddingtop

            saveimg = cv2.copyMakeBorder(img, paddingtop, paddingbottom, paddingleft, paddingright,
                                         cv2.BORDER_CONSTANT, value=0)

            bboxes = [(x + paddingleft, y + paddingtop, width, height)
                      for x, y, width, height in rawboxes]

            filename = filename.replace("/", "_")
            cv2.imwrite(imagesdir + "/" + filename, saveimg)

            # splitext copes with extensions of any length, unlike [:-3].
            stem = os.path.splitext(filename)[0]

            if convet2yoloformat:
                _write_yolo_labels(labelsdir + "/" + stem + ".txt", bboxes,
                                   saveimg.shape[1], saveimg.shape[0])

            if convert2vocformat:
                _write_voc_annotation(vocannotationdir + "/" + stem + ".xml", filename,
                                      saveimg.shape, bboxes)

            index = index + 1

def generatetxt(img_set="train"):
    """Write ``<rootdir>/<img_set>.txt`` listing the converted images of a split.

    One line per image: ``datasetprefix + "/images/" + name`` where ``name``
    is the ground-truth file name with ``/`` replaced by ``_``.  Only images
    with at least one box of positive size that is no smaller than
    ``minsize2select`` are listed, matching the images convertimgset()
    actually writes.

    Args:
        img_set: Split name used to build the input and output paths.
    """
    gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
    listpath = rootdir + "/" + img_set + ".txt"

    # Both files are closed even if parsing raises.
    with open(gtfilepath, 'r') as gtfile, open(listpath, "w") as listfile:
        pending = None  # a line read ahead that is really the next record's name
        while True:
            header = gtfile.readline() if pending is None else pending
            pending = None
            # strip() instead of [:-1]: the last line may lack a trailing newline.
            filename = header.strip()
            if not filename:
                break

            numbbox = int(gtfile.readline())
            rows = [gtfile.readline().split() for _ in range(numbbox)]
            if numbbox == 0:
                # Some releases of the ground truth follow a zero count with
                # an all-zero placeholder row; consume it only if it is one.
                peek = gtfile.readline()
                fields = peek.split()
                if not (len(fields) >= 4 and all(tok.isdigit() for tok in fields)):
                    pending = peek

            # Same acceptance rule as convertimgset(): width and height must
            # be positive and at least minsize2select.
            smallest_ok = max(minsize2select, 1)
            if not any(min(int(row[2]), int(row[3])) >= smallest_ok for row in rows):
                continue

            filename = filename.replace("/", "_")
            listfile.write(datasetprefix + "/images/" + filename + '\n')

def generatevocsets(img_set="train"):
    """Write ``<rootdir>/ImageSets/Main/<img_set>.txt`` with one image id per line.

    The id is the ground-truth file name with ``/`` replaced by ``_`` and the
    extension removed.  Only images with at least one box of positive size
    that is no smaller than ``minsize2select`` are listed, matching the
    annotations convertimgset() actually writes.

    Args:
        img_set: Split name used to build the input and output paths.
    """
    maindir = rootdir + "/ImageSets/Main"
    if not os.path.exists(maindir):
        # makedirs also creates the intermediate ImageSets directory.
        os.makedirs(maindir)

    gtfilepath = rootdir + "/wider_face_split/wider_face_" + img_set + "_bbx_gt.txt"
    setpath = maindir + "/" + img_set + ".txt"

    # Both files are closed even if parsing raises.
    with open(gtfilepath, 'r') as gtfile, open(setpath, 'w') as setfile:
        pending = None  # a line read ahead that is really the next record's name
        while True:
            header = gtfile.readline() if pending is None else pending
            pending = None
            # strip() instead of [:-1]: the last line may lack a trailing newline.
            filename = header.strip()
            if not filename:
                break

            numbbox = int(gtfile.readline())
            rows = [gtfile.readline().split() for _ in range(numbbox)]
            if numbbox == 0:
                # Some releases of the ground truth follow a zero count with
                # an all-zero placeholder row; consume it only if it is one.
                peek = gtfile.readline()
                fields = peek.split()
                if not (len(fields) >= 4 and all(tok.isdigit() for tok in fields)):
                    pending = peek

            # Same acceptance rule as convertimgset(): width and height must
            # be positive and at least minsize2select.
            smallest_ok = max(minsize2select, 1)
            if not any(min(int(row[2]), int(row[3])) >= smallest_ok for row in rows):
                continue

            filename = filename.replace("/", "_")
            # splitext copes with extensions of any length, unlike [:-4].
            setfile.write(os.path.splitext(filename)[0] + '\n')

def convertdataset():
    """Run image conversion, list generation and VOC set generation for "train", then "val"."""
    for split in ("train", "val"):
        convertimgset(split)
        generatetxt(split)
        generatevocsets(split)

if __name__ == "__main__":

    convertdataset()

    # Rename the generated lists in both locations: train -> trainval, val -> test.
    renames = (("train.txt", "trainval.txt"), ("val.txt", "test.txt"))
    for listdir in (rootdir + "/", rootdir + "/ImageSets/Main/"):
        for oldname, newname in renames:
            shutil.move(listdir + oldname, listdir + newname)

widerface---VOC的更多相关文章

YOLO3训练widerface数据集
因为YOLO3速度精度都很棒,所以想训练一下人脸模型,废话不多,进入正题 1写所有的配置文件 1.1 YOLO3-face.cfg 个人感觉YOLO的配置文件其实和caffe差不多在cfg/YOLO ...
Average Precision of VOC
转一篇文章,主要是关于VOC中Average Precision指标的原文出处:https://sanchom.wordpress.com/tag/average-precision/ 还有一篇文章 ...
搭建 MobileNet-SSD 开发环境并使用 VOC 数据集训练 TensorFlow 模型
原文地址:搭建 MobileNet-SSD 开发环境并使用 VOC 数据集训练 TensorFlow 模型 0x00 环境 OS: Ubuntu 1810 x64 Anaconda: 4.6.12 P ...
第三十二节，使用谷歌Object Detection API进行目标检测、训练新的模型(使用VOC 2012数据集)
前面已经介绍了几种经典的目标检测算法,光学习理论不实践的效果并不大,这里我们使用谷歌的开源框架来实现目标检测.至于为什么不去自己实现呢?主要是因为自己实现比较麻烦,而且调参比较麻烦,我们直接利用别人的 ...
VOC数据集生成代码使用说明
#split.py 文件输入格式为images ,和标签txt文件,txt中的数据为坐标值共8个. import os import numpy as np import math import c ...
在Ubuntu内制作自己的VOC数据集
一.VOC数据集的简介 PASCAL VOC为图像的识别和分类提供了一整套标准化的优秀数据集,基本上就是目标检测数据集的模板.现在有VOC2007,VOC2012.主要有20个类.而现在主要的模型评估 ...
Python生成PASCAL VOC格式的xml标注文件
Python生成PASCAL VOC格式的xml标注文件 PASCAL VOC数据集的标注文件是xml格式的.对于py-faster-rcnn,通常以下示例的字段是合适的: <annotatio ...
caffe生成voc格式lmdb
要训练ssd基本都是在liu wei框架下改,生成lmdb这一关照葫芦画瓢总遇坑,记录之: 1. labelmap_voc.prototxt要根据自己的分类修改,比如人脸检测改成这样: item { ...
PASCAL VOC数据集分析（转）
PASCAL VOC数据集分析 PASCAL VOC为图像识别和分类提供了一整套标准化的优秀的数据集,从2005年到2012年每年都会举行一场图像识别challenge. 本文主要分析PASCAL V ...
用python将MSCOCO和Caltech行人检测数据集转化成VOC格式
代码:转换用的代码放在这里之前用Tensorflow提供的object detection API可以很方便的进行fine-tuning实现所需的特定物体检测模型(看这里).那么现在的主要问题就是数 ...

随机推荐

spider随机请求头和ip
#创建爬虫 scrapy genspider randomIp_spider "taobao.com" #把需要请求的url放到一个混淆的url请求list中去,避免被监测到总是访 ...
powerdesigner的PDM模型name和comment相互复制替换
在[Tools]-[Execute Commands]-[Edit/Run Script] 下.输入以下命令,这些命令也可以保存起来,扩展名为 vbs ,以便下次使用. 1.name的值复制到comm ...
最新阿里云申请免费SSL证书实现网站HTTPS化（图文教程一）
一.申请免费SSL证书: 1.登录阿里云: 2.领取代金券礼包: https://promotion.aliyun.com/ntms/yunparter/invite.html?userCode=0a ...
灵雀云获邀加入CDF（持续交付基金会），成为中国区三大创始成员之一
3月12日,在加州Half Moon Bay举行的开源领导者峰会(Open Leadership Summit 2019 )上,CDF(Continuous Delivery Foundation ) ...
asp.net 去掉小数点后面多余的0
很多时候,比如gridview内,不想现实从数据库带出的多余小数 ,比如 4.01000. 那就可以做一个函数: /// <summary> /// 去掉小数点后多余的0, 0本身显示为0 ...
31 Python中 sys.argv[]的用法简明解释（转）
Python中 sys.argv[]的用法简明解释因为是看书自学的python,开始后不久就遇到了这个引入的模块函数,且一直在IDLE上编辑了后运行,试图从结果发现它的用途,然而结果一直都是没结果, ...
calss 类
class Role(object): n = 123 # 类变量,像__init__中life_value,money默认参数用类变量,如果多个类的实例那就节省了内存,类变量只在类中存一份,实例中不 ...
JVM探秘6--图解虚拟机栈的局部变量表和操作数栈工作流程
案例代码如下: public class JVMTest { public static Integer num = 10; public int add(int i){ int j = 5; int ...
vm中的nat模式不能连接到主机，以及不能上网
主机能够ping通vm中的ip,但是vm不能ping通主机ip vm不能ping通主机:主要是虚拟机中的gateway的设置和vm的网络编辑器中的网关id不一致造成的 vm不能上外网:dns没有配置正 ...
js中的排序方法
一.冒泡排序 var arr=[22,1,33,19,77]; function bubbleSort(arr){ for(var i=0;i<arr.length-1;i++){ for( ...

widerface---VOC

widerface---VOC的更多相关文章

随机推荐

热门专题