ICode9

精准搜索请尝试: 精确搜索
首页 > 其他分享> 文章详细

统计VOC数据集中数目

2022-04-29 21:32:16  阅读:236  来源: 互联网

标签:VOC pic label file print total 数目 annotation 统计


统计VOC数据集中种类与对应图片数目,目标个数:

首先需要获取xml文件中种类名称,代码如下:
import xml.dom.minidom as xmldom
import os

#voc数据集获取所有标签的所有类别数"
annotation_path="D:\\TensorflowModels\\ImageData\Pascal_VOC_2007_CatAndDog\\Annotations"

annotation_names=[os.path.join(annotation_path,i) for i in os.listdir(annotation_path)]

labels = list()
for names in annotation_names:
    xmlfilepath = names
    domobj = xmldom.parse(xmlfilepath)
    # 得到元素对象
    elementobj = domobj.documentElement
    #获得子标签
    subElementObj = elementobj.getElementsByTagName("object")
    for s in subElementObj:
        label=s.getElementsByTagName("name")[0].firstChild.data
        #print(label)
        if label not in labels:
            labels.append(label)
print(labels)

自己制做的数据集种类如下:

之后获取种类所对应的xml文件数量与对应的目标个数,代码如下:

import re
import os
import xml.etree.ElementTree as ET
class1 = 'buou'
class2 = 'huangquan'
class3 = 'jumao'
class4 = 'labuladuo'
class5 = 'lihuamao'
class6 = 'meiduan'
class7 = 'taidi'
class8 = 'xueqiaoquan'
'''class9 = 'chair'
class10 = 'cow'
class11 = 'diningtable'
class12 = 'dog'
class13 = 'horse'
class14 = 'motorbike'
class15 = 'person'
class16 = 'pottedplant'
class17 = 'sheep'
class18 = 'sofa'
class19 = 'train'
class20 = 'tvmonitor'
'''
annotation_folder = 'D:\\TensorflowModels\\ImageData\Pascal_VOC_2007_CatAndDog\\Annotations'  #改为⾃⼰标签⽂件夹的路径
#annotation_folder = '/home/.../VOC2007/Annotations/'
list = os.listdir(annotation_folder)
def file_name(file_dir):
 L = []
 for root, dirs, files in os.walk(file_dir):
  for file in files:
   if os.path.splitext(file)[1] == '.xml':
    L.append(os.path.join(root, file))
 return L
total_number1 = 0
total_number2 = 0
total_number3 = 0
total_number4 = 0
total_number5 = 0
total_number6 = 0
total_number7 = 0
total_number8 = 0
'''total_number9 = 0
total_number10 = 0
total_number11 = 0
total_number12 = 0
total_number13 = 0
total_number14 = 0
total_number15 = 0
total_number16 = 0
total_number17 = 0
total_number18 = 0
total_number19 = 0
total_number20 = 0'''
total = 0
total_pic=0

pic_num1 = 0
pic_num2 = 0
pic_num3 = 0
pic_num4 = 0
pic_num5 = 0
pic_num6 = 0
pic_num7 = 0
pic_num8 = 0
'''pic_num9 = 0
pic_num10 = 0
pic_num11 = 0
pic_num12 = 0
pic_num13 = 0
pic_num14 = 0
pic_num15 = 0
pic_num16 = 0
pic_num17 = 0
pic_num18 = 0
pic_num19 = 0
pic_num20 = 0'''

flag1 = 0
flag2 = 0
flag3 = 0
flag4 = 0
flag5 = 0
flag6 = 0
flag7 = 0
flag8 = 0
'''flag9 = 0
flag10 = 0
flag11 = 0
flag12 = 0
flag13 = 0
flag14 = 0
flag15= 0
flag16 = 0
flag17 = 0
flag18 = 0
flag19 = 0
flag20 = 0'''

xml_dirs = file_name(annotation_folder)
for i in range(0, len(xml_dirs)):
 print(xml_dirs[i])
 #path = os.path.join(annotation_folder,list[i])
 #print(path)
 annotation_file = open(xml_dirs[i]).read()
 root = ET.fromstring(annotation_file)
 #tree = ET.parse(annotation_file)
 #root = tree.getroot()
 total_pic = total_pic + 1
 for obj in root.findall('object'):
  label = obj.find('name').text
  if label == class1:
   total_number1=total_number1+1
   flag1=1
   total = total + 1
   #print("bounding box number:", total_number1)
  if label == class2:
   total_number2=total_number2+1
   flag2=1
   total = total + 1
  if label == class3:
   total_number3=total_number3+1
   flag3=1
   total = total + 1
  if label == class4:
   total_number4=total_number4+1
   flag4=1
   total = total + 1
  if label == class5:
   total_number5=total_number5+1
   flag5=1
   total = total + 1
  if label == class6:
   total_number6=total_number6+1
   flag6=1
   total = total + 1
  if label == class7:
   total_number7=total_number7+1
   flag7=1
   total = total + 1
  if label == class8:
   total_number8=total_number8+1
   flag8=1
   total = total + 1
  '''if label == class9:
   total_number9=total_number9+1
   flag9=1
   total = total + 1
  if label == class10:
   total_number10=total_number10+1
   flag10=1
   total = total + 1
  if label == class11:
   total_number11=total_number11+1
   flag11=1
   total = total + 1
  if label == class12:
   total_number12=total_number12+1
   flag12=1
   total = total + 1
  if label == class13:
   total_number13=total_number13+1
   flag13=1
   total = total + 1
  if label == class14:
   total_number14=total_number14+1
   flag14=1
   total = total + 1
  if label == class15:
   total_number15=total_number15+1
   flag15=1
   total = total + 1
  if label == class16:
   total_number16=total_number16+1
   flag16=1
   total = total + 1
  if label == class17:
   total_number17=total_number17+1
   flag17=1
   total = total + 1
  if label == class18:
   total_number18=total_number18+1
   flag18=1
   total = total + 1
  if label == class19:
   total_number19=total_number19+1
   flag19=1
   total = total + 1
  if label == class20:
   total_number20=total_number20+1
   flag20=1
   total = total + 1'''
 if flag1==1:
  pic_num1=pic_num1+1
  #print("pic number:", pic_num1)
  flag1=0
 if flag2==1:
  pic_num2=pic_num2+1
  flag2=0
 if flag3==1:
  pic_num3=pic_num3+1
  flag3=0
 if flag4==1:
  pic_num4=pic_num4+1
  flag4=0
 if flag5==1:
  pic_num5=pic_num5+1
  flag5=0
 if flag6==1:
  pic_num6=pic_num6+1
  flag6=0
 if flag7==1:
  pic_num7=pic_num7+1
  flag7=0
 if flag8==1:
  pic_num8=pic_num8+1
  flag8=0
 '''if flag9==1:
  pic_num9=p
  flag7=0
 if flag8==1:
  pic_num8=pic_num8+1
  flag8=0
 if flag9==1:
  pic_num9=pic_num9+1
  flag9=0
 if flag10==1:
  pic_num10=pic_num10+1
  flag10=0
 if flag11==1:
  pic_num11=pic_num11+1
  flag11=0
 if flag12==1:
  pic_num12=pic_num12+1
  flag12=0
 if flag13==1:
  pic_num13=pic_num13+1
  flag13=0
 if flag14==1:
  pic_num14=pic_num14+1
  flag14=0
 if flag15==1:
  pic_num15=pic_num15+1
  flag15=0
 if flag16==1:
  pic_num16=pic_num16+1
  flag16=0
 if flag17==1:
  pic_num17=pic_num17+1
  flag17=0
 if flag18==1:
  pic_num18=pic_num18+1
  flag18=0
 if flag19==1:
  pic_num19=pic_num19+1
  flag19=0
 if flag20==1:
  pic_num20=pic_num20+1
  flag20=0'''
print(class1,pic_num1,total_number1)
print(class2,pic_num2,total_number2)
print(class3,pic_num3, total_number3)
print(class4,pic_num4, total_number4)
print(class5,pic_num5, total_number5)
print(class6,pic_num6, total_number6)
print(class7,pic_num7, total_number7)
print(class8,pic_num8, total_number8)
'''print(class9,pic_num9, total_number9)
print(class10,pic_num10, total_number10)
print(class11,pic_num11,total_number11)
print(class12,pic_num12,total_number12)
print(class13,pic_num13, total_number13)
print(class14,pic_num14, total_number14)
print(class15,pic_num15, total_number15)
print(class16,pic_num16, total_number16)
print(class17,pic_num17, total_number17)
print(class18,pic_num18, total_number18)
print(class19,pic_num19, total_number19)
print(class20,pic_num20, total_number20)'''
print("total", total_pic, total)

检测结果如下:

参考资料:

https://blog.csdn.net/qq_38441692/article/details/104183666?spm=1001.2101.3001.6650.1&utm_medium=distribute.pc_relevant.none-task-blog-2~default~CTRLIST~default-1.pc_relevant_default&depth_1-utm_source=distribute.pc_relevant.none-task-blog-2~default~CTRLIST~default-1.pc_relevant_default&utm_relevant_index=2

https://wenku.baidu.com/view/fb96521e13661ed9ad51f01dc281e53a580251b1.html

标签:VOC,pic,label,file,print,total,数目,annotation,统计
来源: https://www.cnblogs.com/kxqblog/p/16208342.html

本站声明: 1. iCode9 技术分享网(下文简称本站)提供的所有内容,仅供技术学习、探讨和分享;
2. 关于本站的所有留言、评论、转载及引用,纯属内容发起人的个人观点,与本站观点和立场无关;
3. 关于本站的所有言论和文字,纯属内容发起人的个人观点,与本站观点和立场无关;
4. 本站文章均是网友提供,不完全保证技术分享内容的完整性、准确性、时效性、风险性和版权归属;如您发现该文章侵犯了您的权益,可联系我们第一时间进行删除;
5. 本站为非盈利性的个人网站,所有内容不会用来进行牟利,也不会利用任何形式的广告来间接获益,纯粹是为了广大技术爱好者提供技术内容和技术思想的分享性交流网站。

专注分享技术,共同学习,共同进步。侵权联系[81616952@qq.com]

Copyright (C)ICode9.com, All Rights Reserved.

ICode9版权所有