根據需要修改路徑和自己需要的類即可。
"""Extract the VOC2012 images and annotations that contain a wanted class.

For every XML file in ``fileDir_ann`` the script keeps only the ``<object>``
elements whose name line equals ``classes1`` (``person`` by default).  When at
least one such object exists, the filtered XML is written to ``saveDir_ann``
and the matching ``.jpg`` is copied from ``fileDir_img`` to ``saveDir_img``.

Edit the paths and ``classes1`` below to suit your data set.

NOTE: the XML is processed as plain text.  Object boundaries are recognised
only as lines that are exactly ``"\\t<object>\\n"`` / ``"\\t</object>\\n"``, so
the annotations must be tab-indented with one tag per line.
"""
import os
import os.path
import shutil

fileDir_ann = r'/home/somnus/tttt/VOC2012/Annotations/'
fileDir_img = r'/home/somnus/tttt/VOC2012/JPEGImages/'
# Destination for the images that contain the wanted class.
saveDir_img = r'/home/somnus/tttt/VOC2012/JPEGImages_ssd/'
# Destination for the XML files that belong to those images.
saveDir_ann = r'/home/somnus/tttt/VOC2012/Annotations_ssd/'

# Class names an object's name line is checked against.
classes = ['aeroplane', 'bicycle', 'bird', 'boat', 'bottle', 'bus', 'car',
           'cat', 'chair', 'cow', 'diningtable', 'dog', 'horse', 'motorbike',
           'pottedplant', 'sheep', 'sofa', 'train', 'tvmonitor', 'person']

# The wanted class, written exactly as its line appears in the XML.
classes1 = '\t\t<name>person</name>\n'

OBJECT_OPEN = "\t<object>\n"
OBJECT_CLOSE = "\t</object>\n"


def filter_annotation(lines, wanted=classes1):
    """Keep only the ``<object>`` blocks that contain the line *wanted*.

    Args:
        lines: The annotation file as a list of lines (with line endings).
        wanted: The exact line that marks an object as wanted.

    Returns:
        A ``(filtered_lines, kept)`` tuple.  ``filtered_lines`` is everything
        before the first object, the kept object blocks in their original
        order, and everything after the last object.  ``kept`` is the number
        of object blocks retained.  When the file has no object at all the
        lines are returned unchanged with ``kept == 0``.
    """
    # Positions of every opening and closing object tag.
    starts = [i for i, line in enumerate(lines) if line == OBJECT_OPEN]
    ends = [i for i, line in enumerate(lines) if line == OBJECT_CLOSE]
    if not starts or not ends:
        # Nothing to filter; the original script crashed with IndexError here.
        return list(lines), 0

    header = lines[:starts[0]]
    footer = lines[ends[-1] + 1:]

    kept_blocks = []
    kept = 0
    # zip() pairs the k-th opening tag with the k-th closing tag and silently
    # ignores unmatched trailing tags instead of raising IndexError.
    for start, end in zip(starts, ends):
        block = lines[start:end + 1]
        # The line right after <object> is expected to be the <name> line.
        name_line = block[1] if len(block) > 1 else ""
        if not any(name in name_line for name in classes):
            # Unknown class: skip it rather than reuse a stale block.
            continue
        if wanted in block:
            kept += 1
            kept_blocks.extend(block)

    return header + kept_blocks + footer, kept


def process_annotation(filename, ann_dir=fileDir_ann, img_dir=fileDir_img,
                       out_ann_dir=saveDir_ann, out_img_dir=saveDir_img):
    """Filter one annotation file and copy its image if anything was kept.

    Args:
        filename: Base name of the XML file inside *ann_dir*.
        ann_dir: Directory holding the source annotation.
        img_dir: Directory holding the source ``.jpg`` images.
        out_ann_dir: Directory receiving the filtered annotation.
        out_img_dir: Directory receiving the copied image.

    Returns:
        True when the file contained the wanted class and was exported,
        False otherwise.
    """
    with open(os.path.join(ann_dir, filename)) as fp:
        lines = fp.readlines()

    filtered, kept = filter_annotation(lines)
    out_path = os.path.join(out_ann_dir, filename)

    if kept == 0:
        # The original wrote the file and then deleted it; the end state is
        # the same: no annotation with this name remains in the output dir.
        if os.path.exists(out_path):
            os.remove(out_path)
        return False

    with open(out_path, 'w') as fp_w:
        fp_w.writelines(filtered)

    name_img = os.path.join(img_dir, os.path.splitext(filename)[0] + ".jpg")
    shutil.copy(name_img, out_img_dir)
    return True


def main():
    """Filter every annotation found under ``fileDir_ann``."""
    for directory in (saveDir_img, saveDir_ann):
        if not os.path.exists(directory):
            os.mkdir(directory)

    # Walk all files in Annotations; use the walked root so that files in
    # sub-directories are opened from where they actually live.
    for root, _dirs, filenames in os.walk(fileDir_ann):
        for filename in filenames:
            print(filename + "-->start!")
            process_annotation(filename, ann_dir=root)


if __name__ == "__main__":
    main()
參考