keras_yolo3_detection/data_annotations.py at master · 99312254/keras_yolo3_detection · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
import xml.etree.ElementTree as ET
import os


def convert_annotation(annotation_path, image_id, list_file, classes):
    in_file = open(annotation_path + '%s.xml' % image_id)
    tree = ET.parse(in_file)
    root = tree.getroot()
    image_path = root.findall("path")[0].text
    list_file.write('%s' % image_path)
    for obj in root.iter('object'):
        difficult = obj.find('difficult').text
        cls = obj.find('name').text
        if cls not in classes or int(difficult) == 1:
            continue
        cls_id = classes.index(cls)
        xmlbox = obj.find('bndbox')
        b = (int(xmlbox.find('xmin').text), int(xmlbox.find('ymin').text), int(xmlbox.find('xmax').text), int(xmlbox.find('ymax').text))
        list_file.write(" " + ",".join([str(a) for a in b]) + ',' + str(cls_id))
    list_file.write('\n')


def conver_to_train_list_txt(annotation_path, classes, output_file_dir, train_split=0.8):
    xml_names = os.listdir(annotation_path)
    image_ids = [xml_name[0:-4] for xml_name in xml_names]
    train_data_nums = int(train_split * len(image_ids))
    list_file = open(output_file_dir + 'train_list.txt', 'w')
    list_file_test = open(output_file_dir + 'test_list.txt', 'w')
    for i, image_id in enumerate(image_ids):
        if i < train_data_nums:
            convert_annotation(annotation_path, image_id, list_file, classes)
        else:
            convert_annotation(annotation_path, image_id, list_file_test, classes)
    list_file.close()
    print("convert secessfully! ")
    print("train_nums: %d " % train_data_nums)
    print("test_nums: %d " % (len(image_ids) - train_data_nums))


"""xml_file_path为标注后的XML文件路径，image_path为所标注的图片的路径（该路径下图片数量与标记数量要一致），
output_txtfile_dir为输出的trainlist文件的路径，该文件包含了image的路径的bbox信息。"""

xml_file_path = 'D:\\project3\\chef_hats\\data_augmentation\\annotations\\'
classes = ["head"]  # 可添加所有的class name
train_test_list_txt__dir = 'D:\\project3\\chef_hats\\'
conver_to_train_list_txt(xml_file_path, classes, train_test_list_txt__dir)