制作自己的ILSVRC2015 VID数据集的一些脚本以及流程

前言:刚开始做视频目标检测的时候需要把我们实验室的医疗数据制作成ILSVRC2015 VID这样格式的数据,但是在网上没怎么找到攻略,故把自己的一些经验记录下来。

1、json转xml:由labelme这个软件标注出来的数据集一般都是json格式的,需要把json标注格式转化成xml格式。

import os
 
from typing import List, Any
 
 
 
import numpy as np
 
import codecs
 
import json
 
from glob import glob
 
import cv2
 
import shutil
 
from sklearn.model_selection import train_test_split
 
# 1.标签路径
 
path = "/media/work/data/lx/mega_data/tempdatas/train"              #原始labelme标注数据路径
saved_path = "/media/work/data/lx/mega_data/val_train/"                #保存路径
 
 
 
    # 3.获取待处理文件

for tt in os.listdir(path):
    labelme_path='/media/work/data/lx/mega_data/tempdatas/train'+'/'+tt+'/'
    cont=os.listdir(labelme_path)
    if len(cont)<20:
        continue
    print(labelme_path)
    files = glob(labelme_path + "*.json")
    #print(files)
    files = [i.replace("\\","/").split("/")[-1].split(".json")[0] for i in files]
    
    print(files)
    
    # 4.读取标注信息并写入 xml
    
    for json_file_ in files:
    
        json_filename = labelme_path + json_file_ + ".json"
    
        json_file = json.load(open(json_filename, "r", encoding="utf-8"))
    
        height, width, channels = cv2.imread(labelme_path + json_file_ + ".JPEG").shape

        temp=saved_path+ "/"+ "Annotations/"+"VID/"+"train/"+tt
        if not os.path.exists(temp):
           os.makedirs(temp)
    
        with codecs.open(temp+"/"+ json_file_ + ".xml", "w", "utf-8") as xml:
    
            xml.write('\n')
    
            xml.write('\t' + 'WH_data' + '\n')
    
            xml.write('\t' + json_file_ + ".JPEG" + '\n')
    
            xml.write('\t\n')
    
            xml.write('\t\tWH Data\n')
    
            xml.write('\t\tWH\n')
    
            xml.write('\t\tflickr\n')
    
            xml.write('\t\tNULL\n')
    
            xml.write('\t\n')
    
            xml.write('\t\n')
    
            xml.write('\t\tNULL\n')
    
            xml.write('\t\tWH\n')
    
            xml.write('\t\n')
    
            xml.write('\t\n')
    
            xml.write('\t\t' + str(width) + '\n')
    
            xml.write('\t\t' + str(height) + '\n')
    
            xml.write('\t\t' + str(channels) + '\n')
    
            xml.write('\t\n')
    
            xml.write('\t\t0\n')
    
            for multi in json_file["shapes"]:
    
                points = np.array(multi["points"])
    
                labelName=multi["label"]
    
                xmin = min(points[:, 0])
    
                xmax = max(points[:, 0])
    
                ymin = min(points[:, 1])
    
                ymax = max(points[:, 1])
    
                label = multi["label"]
    
                if xmax <= xmin:
    
                    pass
    
                elif ymax <= ymin:
    
                    pass
    
                else:
    
                    xml.write('\t\n')
    
                    xml.write('\t\t' + labelName.lower()+ '\n')
    
                    xml.write('\t\tUnspecified\n')
    
                    xml.write('\t\t1\n')
    
                    xml.write('\t\t0\n')
    
                    xml.write('\t\t\n')
    
                    xml.write('\t\t\t' + str(int(xmin)) + '\n')
    
                    xml.write('\t\t\t' + str(int(ymin)) + '\n')
    
                    xml.write('\t\t\t' + str(int(xmax)) + '\n')
    
                    xml.write('\t\t\t' + str(int(ymax)) + '\n')
    
                    xml.write('\t\t\n')
    
                    xml.write('\t\n')
    
                    print(json_filename, xmin, ymin, xmax, ymax, label)
    
            xml.write('')
    
    # 5.复制图片到 VOC2007/JPEGImages/下
    
    image_files = glob(labelme_path + "*.JPEG")
    
    print("copy image files to VOC007/JPEGImages/")

    temp2=saved_path+"/Data/VID/train/"+tt
    if not os.path.exists(temp2):
           os.makedirs(temp2)
    
    for image in image_files:
    
        shutil.copy(image, temp2)
    
    # 6.split files for txt
    
    txtsavepath = saved_path + "ImageSets/Main/"
    
    ftrainval = open(txtsavepath + '/trainval.txt', 'w')
    
    ftest = open(txtsavepath + '/test.txt', 'w')
    
    ftrain = open(txtsavepath + '/train.txt', 'w')
    
    fval = open(txtsavepath + '/val.txt', 'w')
    
    total_files = glob("./VOC2007/Annotations/*.xml")
    
    total_files = [i.replace("\\","/").split("/")[-1].split(".xml")[0] for i in total_files]
    
    trainval_files=[]
    
    test_files=[]
    
    if isUseTest:
    
        trainval_files, test_files = train_test_split(total_files, test_size=0.15, random_state=55)
    
    else:
    
        trainval_files=total_files
    
    for file in trainval_files:
    
        ftrainval.write(file+"\n")
    
    # split
    
    train_files, val_files = train_test_split(trainval_files, test_size=0.15, random_state=55)
    
    # train
    
    for file in train_files:
    
        ftrain.write(file + "\n")
    
    # val
    
    for file in val_files:
    
        fval.write(file +"\n")
    
    for file in test_files:
    
        print(file)
    
        ftest.write(file + "\n")
    
    ftrainval.close()
    
    ftrain.close()
    
    fval.close()
    
    ftest.close()

2、当组织好了Annotations和Data的每一个视频一一对应之后,对每一个视频帧文件夹进行重命名排序(我跑的那个模型可能需要,其他的可能不太清楚)

# -*- coding:utf8 -*-
 
import os
 
class BatchRename():
    '''
    批量重命名文件夹中的图片文件
    '''
    def __init__(self):
        self.path = '/home/liutianen/datasets/ILSVRC2015/Data/VID/train'
        
   
           
            
 
    def rename(self):
        filelist = os.listdir(self.path)
        total_num = len(filelist)
        for tt in filelist:
            i = 0
            print(tt)
            ttt=os.listdir('/home/liutianen/datasets/ILSVRC2015/Data/VID/train'+'/'+tt)
            ttt.sort()
            #ttt.sort(key=lambda x:str(x.split('.')[1]))
            print(ttt)
            for item in ttt:
                print(item)
                if item.endswith('.jpg'):
                    temp=' '
                    print(1111111111111)
                    if i<10:
                        temp='00000'+str(i)
                    if i<100 and i>=10:
                        temp='0000'+str(i)
                    if i<1000 and i>=100:
                        temp='000'+str(i)
                    if i>=1000 and i<10000:
                        temp='00'+str(i)
                    if i>=10000:
                        temp=str(i)
                    src = os.path.join(os.path.abspath(self.path), tt+'/'+item)
                    dst = os.path.join(os.path.abspath(self.path), tt+'/'+temp+ '.JPEG')
                    temp=' '
                    print(src)
                    print(dst)
                    
                    try:
                        os.rename(src, dst)
                        i=i+1
                        print('converting %s to %s ...' % (src, dst))
                    except:
                        continue

        print ('total %d to rename & converted %d jpgs' % (total_num, i))
 
if __name__ == '__main__':
    demo = BatchRename()
    demo.rename()

3、制作VID_val_frames.txt等ImageSets文档,大体上每个txt制作差不多,一些细节上的内容可能要更改。

import os
 
from typing import List, Any
 
 
 
import numpy as np
 
import codecs
 
import json
 
from glob import glob
 
import cv2
 
import shutil
 
 
# 1.标签路径
 
path = "/home/liutianen/datasets/ILSVRC2015/Data/VID/val"              #原始labelme标注数据路径
saved_path = "/home/liutianen/datasets/ILSVRC2015"                #保存路径
 
 
 
    # 3.获取待处理文件
file = open('/home/liutianen/datasets/ILSVRC2015/ImageSets/VID_val_frames.txt','w')
dd=os.listdir(path)
dd.sort()
j=1
for tt in dd:
    labelme_path='/home/liutianen/datasets/ILSVRC2015/Data/VID/val'+'/'+tt+'/'
    print(labelme_path)    

    
    image_files = glob(labelme_path + "*.jpg")
    

    temp2=saved_path+"/" +"Data/VID/val/"+tt
    lenth=len(os.listdir(temp2))
    xx="val/"+tt
    ww=os.listdir(temp2)
    ww.sort()
    for aa in ww:
       temp3=xx+"/"+ aa.split('.')[0]+" "+str(j)+"\n"
       file.write(temp3)
       j=j+1
    
    
   

你可能感兴趣的:(深度学习,计算机视觉,python)