widerface数据库转voc2007数据集（python/matlab实现）

原作者: [db:作者] 来自: [db:来源] 收藏邀请

下面的 Python 实现只满足基本需求，可以在此基础上按需修改。

# -*- coding: utf-8 -*-
"""
Created on 17-5-27

@author: zly 
"""
from skimage import io
import shutil
import random
import os
import string

# Opening part of an annotation file. Placeholders, in order: image number
# (rendered as %06d.jpg), width, height, depth.
headstr = """\
<annotation>
    <folder>VOC2007</folder>
    <filename>%06d.jpg</filename>
    <source>
        <database>My Database</database>
        <annotation>PASCAL VOC2007</annotation>
        <image>flickr</image>
        <flickrid>NULL</flickrid>
    </source>
    <owner>
        <flickrid>NULL</flickrid>
        <name>company</name>
    </owner>
    <size>
        <width>%d</width>
        <height>%d</height>
        <depth>%d</depth>
    </size>
    <segmented>0</segmented>
"""
# One <object> element. Placeholders, in order: class name, xmin, ymin,
# xmax, ymax.
objstr = """\
    <object>
        <name>%s</name>
        <pose>Unspecified</pose>
        <truncated>0</truncated>
        <difficult>0</difficult>
        <bndbox>
            <xmin>%d</xmin>
            <ymin>%d</ymin>
            <xmax>%d</xmax>
            <ymax>%d</ymax>
        </bndbox>
    </object>
"""

# Closing tag written after the last <object> element.
tailstr = '''\
</annotation>
'''

def all_path(filename):
    """Return *filename* joined onto the ``widerface`` dataset directory."""
    dataset_root = 'widerface'
    return os.path.join(dataset_root, filename)

def writexml(idx, head, bbxes, tail):
    """Write the annotation file for image number *idx*.

    Args:
        idx: Image number; the output is ``Annotations/%06d.xml`` under the
            directory returned by ``all_path``.
        head: Already-formatted header text, written first.
        bbxes: Iterable of boxes whose first four items are
            ``x, y, width, height``; any further items are ignored.
        tail: Closing text, written last.
    """
    filename = all_path("Annotations/%06d.xml" % (idx))
    # The context manager closes the file even if formatting a box raises.
    with open(filename, "w") as f:
        f.write(head)
        for bbx in bbxes:
            x, y, w, h = bbx[:4]
            # Corners are written as (x, y) and (x + width, y + height).
            f.write(objstr % ('face', x, y, x + w, y + h))
        f.write(tail)


def clear_dir():
    """Reset the output directories under the dataset root.

    Any existing ``Annotations``, ``ImageSets`` and ``JPEGImages`` trees are
    removed, then ``Annotations``, ``ImageSets/Main`` and ``JPEGImages`` are
    created empty.
    """
    for name in ('Annotations', 'ImageSets', 'JPEGImages'):
        stale = all_path(name)
        if os.path.exists(stale):
            shutil.rmtree(stale)

    os.mkdir(all_path('Annotations'))
    os.makedirs(all_path('ImageSets/Main'))
    os.mkdir(all_path('JPEGImages'))


def _parse_bbx_line(line):
    """Return the integer fields of *line*, or None if a field is not an integer.

    A blank line yields an empty list.
    """
    try:
        return [int(token) for token in line.split()]
    except ValueError:
        return None


def excute_datasets(idx, datatype):
    """Convert one split of the ground-truth text file into VOC-style files.

    For every image listed in ``wider_face_split/wider_face_<datatype>_bbx_gt.txt``
    this writes ``Annotations/<idx>.xml``, copies the image to
    ``JPEGImages/<idx>.jpg`` and appends the six-digit index to
    ``ImageSets/Main/<datatype>.txt``.

    Args:
        idx: Number assigned to the first image of this split.
        datatype: Split name used to build the paths, e.g. ``'train'`` or
            ``'val'``.

    Returns:
        The next unused image number, so splits can be chained.
    """
    image_dir = 'WIDER_' + datatype + '/images/'
    list_path = all_path('ImageSets/Main/' + datatype + '.txt')
    gt_path = all_path('wider_face_split/wider_face_' + datatype + '_bbx_gt.txt')

    # Both files are closed even if reading an image or parsing a line raises.
    with open(list_path, 'a') as f, open(gt_path, 'r') as f_bbx:
        pending = None  # a line read ahead that belongs to the next record
        while True:
            if pending is None:
                line = f_bbx.readline()
            else:
                line, pending = pending, None
            filename = line.strip()
            if not filename:
                # End of file (or a blank line) terminates the listing.
                break

            src = all_path(image_dir + filename)
            im = io.imread(src)
            # Grayscale images come back as 2-D arrays without a channel axis.
            depth = im.shape[2] if len(im.shape) > 2 else 1
            head = headstr % (idx, im.shape[1], im.shape[0], depth)

            count = int(f_bbx.readline().strip())
            bbxes = []
            for _ in range(count):
                # x1, y1, w, h, blur, expression, illumination, invalid, occlusion, pose
                bbx = [int(token) for token in f_bbx.readline().split()]
                if bbx[7] == 0:  # keep only boxes not flagged invalid
                    bbxes.append(bbx)
            if count == 0:
                # NOTE(review): some releases of the ground-truth file reportedly
                # follow a face count of 0 with a dummy all-numeric box line.
                # A purely numeric line cannot be an image path, so drop it;
                # anything else is kept as the next record's file name.
                peek = f_bbx.readline()
                if not _parse_bbx_line(peek):
                    pending = peek

            writexml(idx, head, bbxes, tailstr)
            shutil.copyfile(src, all_path('JPEGImages/%06d.jpg' % (idx)))
            f.write('%06d\n' % (idx))
            idx += 1
    return idx


# Shuffle the samples
def shuffle_file(filename):
    """Randomly reorder the lines of *filename* in place.

    Args:
        filename: Path of a text file with one sample per line.
    """
    # The context manager closes the file even if reading or writing fails.
    with open(filename, 'r+') as f:
        lines = f.readlines()
        # Without a final newline the last entry would fuse with whichever
        # line ends up after it once the order changes.
        if lines and not lines[-1].endswith('\n'):
            lines[-1] += '\n'
        random.shuffle(lines)
        f.seek(0)
        f.truncate()
        f.writelines(lines)


if __name__ == '__main__':
    # Start from empty output directories, then number the images
    # consecutively across the train and val splits.
    clear_dir()
    idx = 1
    for split in ('train', 'val'):
        idx = excute_datasets(idx, split)

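目录结构如下（均位于 widerface/ 目录下）：

- WIDER_train/images/、WIDER_val/images/：原始图片
- wider_face_split/：标注文件（wider_face_train_bbx_gt.txt、wider_face_val_bbx_gt.txt）
- Annotations/、ImageSets/Main/、JPEGImages/：脚本生成的 VOC 格式输出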

以下 Python 代码通过读取 .mat 标注文件进行转换，已废弃，仅供学习参考。

import h5py
from skimage import io
import shutil
import random

# Opening part of an annotation file. Placeholders, in order: image number
# (rendered as %06d.jpg), width, height, depth.
headstr = """\
<annotation>
    <folder>VOC2007</folder>
    <filename>%06d.jpg</filename>
    <source>
        <database>My Database</database>
        <annotation>PASCAL VOC2007</annotation>
        <image>flickr</image>
        <flickrid>NULL</flickrid>
    </source>
    <owner>
        <flickrid>NULL</flickrid>
        <name>facevise</name>
    </owner>
    <size>
        <width>%d</width>
        <height>%d</height>
        <depth>%d</depth>
    </size>
    <segmented>0</segmented>
"""
# One <object> element. Placeholders, in order: class name, xmin, ymin,
# xmax, ymax.
objstr = """\
    <object>
        <name>%s</name>
        <pose>Unspecified</pose>
        <truncated>0</truncated>
        <difficult>0</difficult>
        <bndbox>
            <xmin>%d</xmin>
            <ymin>%d</ymin>
            <xmax>%d</xmax>
            <ymax>%d</ymax>
        </bndbox>
    </object>
"""

# Closing tag written after the last <object> element.
tailstr ='''\
</annotation>
'''
def writexml(idx, head, objs, tail):
    """Write ``Annotations/<idx>.xml`` as *head*, *objs* and *tail* concatenated.

    Args:
        idx: Image number, rendered as six zero-padded digits in the file name.
        head: Text written first.
        objs: Text written second (the already-formatted object elements).
        tail: Text written last.
    """
    filename = "Annotations/%06d.xml" % (idx)
    # The context manager closes the file even if one of the writes raises.
    with open(filename, "w") as f:
        f.write(head)
        f.write(objs)
        f.write(tail)
    
def clear_dir():
    """Reset the output directories in the current working directory.

    Any existing ``Annotations``, ``ImageSets`` and ``JPEGImages`` trees are
    removed, then ``Annotations``, ``ImageSets/Main`` and ``JPEGImages`` are
    created empty.
    """
    fs = shutil.os  # the os module, reached through shutil as elsewhere in this script
    for stale in ('Annotations', 'ImageSets', 'JPEGImages'):
        if fs.path.exists(stale):
            shutil.rmtree(stale)

    fs.mkdir('Annotations')
    fs.makedirs('ImageSets/Main')
    fs.mkdir('JPEGImages')
    
def excute_datasets(idx, datatype):
    """Convert one split described by ``wider_face_<datatype>.mat`` into VOC-style files.

    For every image this writes ``Annotations/<idx>.xml``, copies the image to
    ``JPEGImages/<idx>.jpg`` and appends the six-digit index to
    ``ImageSets/Main/<datatype>.txt``.

    Args:
        idx: Number assigned to the first image of this split.
        datatype: Split name used to build the paths, e.g. ``'train'`` or
            ``'val'``.

    Returns:
        The next unused image number, so splits can be chained.
    """
    # Both the list file and the HDF5 file are closed even if an image fails
    # to load part-way through.
    with open('ImageSets/Main/'+datatype+'.txt', 'a') as f, \
            h5py.File('wider_face_split/wider_face_'+datatype+'.mat', 'r') as mat:
        # NOTE(review): the entries of these arrays are used below as keys into
        # `mat`, so they are presumably HDF5 object references - confirm.
        file_list = mat['file_list'][:]
        event_list = mat['event_list'][:]
        bbx_list = mat['face_bbx_list'][:]
        for i in range(file_list.size):
            file_list_sub = mat[file_list[0,i]][:]
            bbx_list_sub = mat[bbx_list[0, i]][:]
            # Names are stored as character codes and rebuilt with chr().
            event_value = ''.join(chr(x) for x in mat[event_list[0,i]][:])
            for j in range(file_list_sub.size):
                root = 'WIDER_'+datatype+'/images/'+event_value+'/'
                filename = root + ''.join([chr(x) for x in mat[file_list_sub[0, j]][:]])+'.jpg'
                im = io.imread(filename)
                # Grayscale images come back as 2-D arrays without a channel axis.
                depth = im.shape[2] if len(im.shape) > 2 else 1
                head = headstr % (idx, im.shape[1], im.shape[0], depth)
                bboxes = mat[bbx_list_sub[0, j]][:]
                # Rows 0..3 of each column are read as x, y, width, height;
                # the far corner is written as x + width - 1, y + height - 1.
                objs = ''.join([objstr % ('face', \
                       bboxes[0,k],bboxes[1,k], bboxes[0,k]+bboxes[2,k]-1,bboxes[1,k]+bboxes[3,k]-1) \
                       for k in range(bboxes.shape[1])])
                writexml(idx, head, objs, tailstr)
                shutil.copyfile(filename, 'JPEGImages/%06d.jpg' % (idx))
                f.write('%06d\n' % (idx))
                idx +=1
    return idx
# Shuffle the samples
def shuffle_file(filename):
    """Randomly reorder the lines of *filename* in place.

    Args:
        filename: Path of a text file with one sample per line.
    """
    # The context manager closes the file even if reading or writing fails.
    with open(filename, 'r+') as f:
        lines = f.readlines()
        # Without a final newline the last entry would fuse with whichever
        # line ends up after it once the order changes.
        if lines and not lines[-1].endswith('\n'):
            lines[-1] += '\n'
        random.shuffle(lines)
        f.seek(0)
        f.truncate()
        f.writelines(lines)
            
if __name__ == '__main__':
    # Start from empty output directories, then number the images
    # consecutively across the train and val splits.
    clear_dir()
    idx = 1
    for split in ('train', 'val'):
        idx = excute_datasets(idx, split)

matlab实现

head.xml

<annotation>
    <folder>widerface</folder>
    <filename>%06d.jpg</filename>
    <source>
        <database>My Database</database>
        <annotation>VOC2007</annotation>
        <image>flickr</image>
        <flickrid>NULL</flickrid>
    </source>
    <owner>
        <flickrid>NULL</flickrid>
        <name>facevise</name>
    </owner>
    <size>
        <width>%d</width>
        <height>%d</height>
        <depth>%d</depth>
    </size>
    <segmented>0</segmented>

object.xml

    <object>
        <name>%s</name>
        <pose>Unspecified</pose>
        <truncated>0</truncated>
        <difficult>0</difficult>
        <bndbox>
            <xmin>%d</xmin>
            <ymin>%d</ymin>
            <xmax>%d</xmax>
            <ymax>%d</ymax>
        </bndbox>
    </object>

tail.xml

</annotation>

function WiderFace2VOC()
% WiderFace2VOC  Convert the WIDER FACE train/val splits to a VOC2007-style layout.
%
% Reads wider_face_split/wider_face_train.mat and wider_face_val.mat plus the
% images under WIDER_train/images and WIDER_val/images, and writes
% Annotations/%06d.xml, JPEGImages/%06d.jpg and the ImageSets/Main/*.txt lists
% in the current directory. head.xml, object.xml and tail.xml must be present
% and are used as fprintf format strings.
%
% Every train image is listed in train.txt and trainval.txt. Val images with
% an odd index are listed in val.txt and trainval.txt; those with an even
% index are listed in test.txt.

%% wider face
% The corresponding annotations are in the following format:
% Here, each face bounding box is denoted by:
% <x_left y_top width height>.

%% voc
% 000001.jpg car 44 28 132 121
% Image name first, then the object class, then the bounding box given as
% its top-left and bottom-right corner coordinates.

%%
clc;
clear;
fclose all;
% Three outputs suppress the error rmdir/mkdir would raise if the directory
% is missing / already exists.
[~, ~, ~] = rmdir('Annotations', 's');
[~, ~, ~] = rmdir('ImageSets', 's');
[~, ~, ~] = rmdir('JPEGImages', 's');

[~, ~, ~] = mkdir('Annotations');
[~, ~, ~] = mkdir('ImageSets/Main');
[~, ~, ~] = mkdir('JPEGImages');

train_root = 'WIDER_train/images';
split_file = 'wider_face_split/wider_face_train';
data = load(split_file);

% fread returns a column vector; transpose so each template is the char row
% vector that fprintf documents for its format argument.
headXml = fopen('head.xml', 'r');
headXmlFormat = fread(headXml, Inf, '*char')';
fclose(headXml);

objectXml = fopen('object.xml', 'r');
objectXmlFormat = fread(objectXml, Inf, '*char')';
fclose(objectXml);

tailXml = fopen('tail.xml', 'r');
tailXmlFormat = fread(tailXml, Inf, '*char')';
fclose(tailXml);

trainID =  fopen('ImageSets/Main/train.txt', 'w');
trainvalID =  fopen('ImageSets/Main/trainval.txt', 'w');
valID =  fopen('ImageSets/Main/val.txt', 'w');
testID =  fopen('ImageSets/Main/test.txt', 'w');

idx = 1;
for i=1:numel(data.event_list)
    for j=1:numel(data.file_list{i})
        imagename = fullfile(train_root, data.event_list{i}, strcat(data.file_list{i}{j}, '.jpg'));
        % Asking size for three outputs yields depth 1 for grayscale images,
        % where indexing the third element of size()'s vector would error.
        [imgH, imgW, imgD] = size(imread(imagename));
        AnnotationsXml = fopen(sprintf('Annotations/%06d.xml', idx), 'w');
        fprintf(AnnotationsXml, headXmlFormat, idx, imgW, imgH, imgD);
        for k = 1:size(data.face_bbx_list{i}{j}, 1)
            rc = data.face_bbx_list{i}{j}(k, :);
            % [x y w h] -> [xmin ymin xmax ymax]
            rc = round([rc(1), rc(2), rc(1)+rc(3)-1, rc(2)+rc(4)-1]);
            fprintf(AnnotationsXml, objectXmlFormat, 'face', rc(1), rc(2), rc(3), rc(4));
        end
        fprintf(AnnotationsXml, tailXmlFormat);
        fprintf(trainID, '%06d\n', idx);
        fprintf(trainvalID, '%06d\n', idx);
        fclose(AnnotationsXml);
        copyfile(imagename, sprintf('JPEGImages/%06d.jpg', idx));
        idx = idx + 1;
    end
    disp(i);
end

% Second pass: the val split, numbered on from where the train split stopped.
train_root = 'WIDER_val/images';
split_file = 'wider_face_split/wider_face_val';
data = load(split_file);

for i=1:numel(data.event_list)
    for j=1:numel(data.file_list{i})
        imagename = fullfile(train_root, data.event_list{i}, strcat(data.file_list{i}{j}, '.jpg'));
        [imgH, imgW, imgD] = size(imread(imagename));
        AnnotationsXml = fopen(sprintf('Annotations/%06d.xml', idx), 'w');
        fprintf(AnnotationsXml, headXmlFormat, idx, imgW, imgH, imgD);
        for k = 1:size(data.face_bbx_list{i}{j}, 1)
            rc = data.face_bbx_list{i}{j}(k, :);
            rc = round([rc(1), rc(2), rc(1)+rc(3)-1, rc(2)+rc(4)-1]);
            fprintf(AnnotationsXml, objectXmlFormat, 'face', rc(1), rc(2), rc(3), rc(4));
        end
        fprintf(AnnotationsXml, tailXmlFormat);
        % Odd indices go to val (and trainval), even indices to test.
        if mod(idx, 2)
            fprintf(valID, '%06d\n', idx);
            fprintf(trainvalID, '%06d\n', idx);
        else
            fprintf(testID, '%06d\n', idx);
        end
        fclose(AnnotationsXml);
        copyfile(imagename, sprintf('JPEGImages/%06d.jpg', idx));
        idx = idx+1;
    end
    disp(i);
end
fclose(trainID);
fclose(trainvalID);
fclose(valID);
fclose(testID);
fclose all;

鲜花

握手

雷人

路过

鸡蛋

该文章已有0人参与评论

请发表评论

全部评论

专题导读

More+

10-27 六六分期app的软件客服如何联系？(六六分期

11-06 可心卡盟:win10系统火狐flash插件崩溃怎么

11-06 亲亲特价:怎么删除回收站图标

11-06 济南大学虚拟社区:鲁大师节能降温的具体办

11-06 xlueops.exe:无线网络安装向导

11-06 女斗合众国:win7系统cf与主机连接不稳定怎

11-06 0xc000022-[cf烟雾头]cf怎么调烟雾头

11-06 qizideyouhuo:应用程序无法正常启动0xc0000

11-06 ipz-185:win7系统vcf文件怎么打开

11-06 傻哥蹦迪:win10系统s4怎么打开usb调试

11-06 八神浩树gtaste:回收站清空了怎么恢复

11-06 妖尾之黑色守护:win10系统电脑没有1440x900

11-06 校园至尊魔王小说:win7系统浏览网页时字体

11-06 女斗合众国:win10系统访问共享文件夹提示请

11-06 tokyo hot n0654:恢复win7系统默认字体一招

11-06 雨酷仙境:设置win7系统转移临时文件夹腾出

11-06 阿穆纳伊之杖:win7系统开始菜单在右边还原

11-06 tunespotting:win10系统火狐flash插件总是

11-06 甘尔葛分析师：计谋网站seo关键词暴涨有什

11-06 蔡贵霖: 计谋网站seo关键词暴涨有什么秘密

11-06 博益网首页:ao3网页版进入不了解决方法

11-06 漏斗子专栏: 网站数据分析小白易懂精华篇

11-06 见证双虹怎么做:win7系统开启telnet命令的

11-06 颾狐蝶蜋:系统资源不足无法完成请求的服务

11-06 国光中学校歌:提交网站到alexa查询详细步骤

11-06 西安有情天:静态网页和动态网页的区别

11-06 红木雅尚斋:外部链接构造对网站的好处

11-06 前官礼遇：防止域名劫持–增强域安全性的10

11-06 密传二转答案: 中文分词算法有哪些

11-06 金泉家园邮编:百度快照劫持的表现及应对方

Delphi Firemonkey Button ImageList发布时间：2022-07-18

Delphi web应用开发框架 - 第二部发布时间：2022-07-18

剪的笔顺,诠释剪的笔画,认识剪的部首

六六分期app的软件客服如何联系？(六六分期

2023-10-27

florent37/ViewAnimator: A fluent Android

2022-08-15

florent37/Shrine-MaterialDesign2: implem

2022-08-17

CVE-2020-36276

2022-09-23

SimpleSoftwareIO/simple-sms: Send and re

2022-08-13

阅读排行榜

1 六六分期app的软件客服如何联系？(六六分期

六六分期app的软件客服如何联系？不知道吗？加qq群【895510560】即可！标题：六六分期

阅读：19166|2023-10-27

2 可心卡盟:win10系统火狐flash插件崩溃怎么

今天小编告诉大家如何处理win10系统火狐flash插件总是崩溃的问题，可能很多用户都不知

阅读：9981|2022-11-06

3 亲亲特价:怎么删除回收站图标

今天小编告诉大家如何对win10系统删除桌面回收站图标进行设置，可能很多用户都不知道

阅读：8321|2022-11-06

4 济南大学虚拟社区:鲁大师节能降温的具体办

今天小编告诉大家如何对win10系统电脑设置节能降温的设置方法，想必大家都遇到过需要

阅读：8690|2022-11-06

5 xlueops.exe:无线网络安装向导

我们在使用xp系统的过程中,经常需要对xp系统无线网络安装向导设置进行设置，可能很多

阅读：8634|2022-11-06

6 女斗合众国:win7系统cf与主机连接不稳定怎

今天小编告诉大家如何处理win7系统玩cf老是与主机连接不稳定的问题，可能很多用户都不

阅读：9650|2022-11-06

7 0xc000022-[cf烟雾头]cf怎么调烟雾头

电脑对日常生活的重要性小编就不多说了，可是一旦碰到win7系统设置cf烟雾头的问题，很

阅读：8617|2022-11-06

8 qizideyouhuo:应用程序无法正常启动0xc0000

我们在日常使用电脑的时候，有的小伙伴们可能在打开应用的时候会遇见提示应用程序无法

阅读：7994|2022-11-06

9 ipz-185:win7系统vcf文件怎么打开

今天小编告诉大家如何对win7系统打开vcf文件进行设置，可能很多用户都不知道怎么对win

阅读：8648|2022-11-06

10 傻哥蹦迪:win10系统s4怎么打开usb调试

今天小编告诉大家如何对win10系统s4开启USB调试模式进行设置，可能很多用户都不知道怎

阅读：7531|2022-11-06

客服电话

电子邮件

widerface数据库转voc2007数据集（python/matlab实现）

请发表评论

全部评论

上一篇：

下一篇：

bluegill/katana:

OpenNBS/OpenNoteBlockStudio: An open-sou

juleswhite/mobilecloud-15: Programming C

JunichiT/JTMaterialSwitch: A Customizabl

delphi 数据导出进度条自己生成

剪的笔顺,诠释剪的笔画,认识剪的部首

六六分期app的软件客服如何联系？(六六分期

florent37/ViewAnimator: A fluent Android

florent37/Shrine-MaterialDesign2: implem

CVE-2020-36276

SimpleSoftwareIO/simple-sms: Send and re

关于我们

产品与服务

解决方案

139-2527-9053

客服电话

电子邮件

widerface数据库转voc2007数据集（python/matlab实现）

请发表评论

全部评论

上一篇：

下一篇：

bluegill/katana:

OpenNBS/OpenNoteBlockStudio: An open-sou

juleswhite/mobilecloud-15: Programming C

JunichiT/JTMaterialSwitch: A Customizabl

delphi 数据导出 进度条自己生成

剪的笔顺,诠释剪的笔画,认识剪的部首

六六分期app的软件客服如何联系？(六六分期

florent37/ViewAnimator: A fluent Android

florent37/Shrine-MaterialDesign2: implem

CVE-2020-36276

SimpleSoftwareIO/simple-sms: Send and re

关于我们

产品与服务

解决方案

139-2527-9053

delphi 数据导出进度条自己生成