# extract_data.py -- from ambirpatel/Object-Localization-using-Deep-Reinforcement-Learning (master branch)
#%%
import os
from os import listdir
from os.path import isfile, join
import shutil
import xmltodict
import cv2
import pickle
#%%
# Dataset layout: folder names are joined onto ROOT_PATH when reading files.
ROOT_PATH = "VOC2012"
ANNOTATION_FOLDER = "Annotations"
IMAGE_FOLDER = "JPEGImages"

# Class vocabulary; the position of a name in this list is its integer label.
CLASSES = [
    "person", "bird", "cat", "cow", "dog",
    "horse", "sheep", "aeroplane", "bicycle", "boat",
    "bus", "car", "motorbike", "train", "bottle",
    "chair", "diningtable", "pottedplant", "sofa", "tvmonitor",
]

# Maps each class name to its index in CLASSES.
CLASS_TO_LABEL = {class_name: label for label, class_name in enumerate(CLASSES)}
#%%
# Defining functions for extracting relevant data from the VOC 2012 database
def extract_objects(xml):
    """Return the annotated objects of a parsed annotation as a list.

    Args:
        xml: Parsed annotation mapping; ``xml['annotation']['object']`` is
            either a single mapping (one object) or a list of mappings.

    Returns:
        A list of object mappings. A lone object is wrapped in a
        one-element list; an existing list is returned unchanged.

    Raises:
        KeyError: if ``'annotation'`` or ``'object'`` is missing.
    """
    objects = xml['annotation']['object']
    # Check for the list case instead of ``xmltodict.OrderedDict``: that name
    # is not part of xmltodict's public API and newer releases, which return
    # plain dicts, no longer expose it. Testing for ``list`` works for both
    # OrderedDict and dict results.
    return objects if isinstance(objects, list) else [objects]

def extract_labels(xml):
    """Return the integer label of every object in a parsed annotation.

    Each object's ``'name'`` is looked up in ``CLASS_TO_LABEL``; the labels
    are returned in the order produced by ``extract_objects``.
    """
    labels = []
    for annotated_object in extract_objects(xml):
        labels.append(CLASS_TO_LABEL[annotated_object['name']])
    return labels

def extract_bounding_boxes(xml):
    """Return one ``(xmin, ymin, xmax, ymax)`` tuple per annotated object.

    Each coordinate is read from the object's ``'bndbox'`` entry, parsed as a
    float, rounded, and converted to ``int``. Boxes are returned in the order
    produced by ``extract_objects``.
    """
    corner_keys = ('xmin', 'ymin', 'xmax', 'ymax')
    boxes = []
    for annotated_object in extract_objects(xml):
        corners = []
        for key in corner_keys:
            raw_value = annotated_object['bndbox'][key]
            corners.append(int(round(float(raw_value))))
        boxes.append(tuple(corners))
    return boxes

def format_data(data):
    """Flatten the per-image records into a list of tuples.

    Args:
        data: Mapping whose values are dicts with the keys ``"image"``,
            ``"labels"`` and ``"bounding_boxes"``. The mapping's keys are
            ignored.

    Returns:
        A list of ``(image, bounding_boxes, labels)`` tuples, one per value of
        ``data``, in the mapping's iteration order.
    """
    records = []
    for entry in data.values():
        image = entry["image"]
        labels = entry["labels"]
        bounding_boxes = entry["bounding_boxes"]
        records.append((image, bounding_boxes, labels))
    return records

def process_data():
    """Convert the VOC annotations and images into the ``out_rl`` dataset.

    Every regular file in ``ROOT_PATH/ANNOTATION_FOLDER`` is parsed with
    ``xmltodict``; its labels and bounding boxes are extracted and the image
    with the same base name is read from ``ROOT_PATH/IMAGE_FOLDER``.

    Outputs (relative to the current working directory):

    * ``out_rl/imgs/<i>.png`` -- the i-th image, re-encoded as PNG.
    * ``out_rl/bounding_boxes.p`` -- pickled list; entry ``i`` is the list of
      ``(xmin, ymin, xmax, ymax)`` tuples of image ``i``.
    * ``out_rl/labels_rl.p`` -- pickled list; entry ``i`` is the list of
      integer labels of image ``i``.

    An existing ``out_rl/imgs`` directory is deleted before writing.

    Raises:
        OSError: if an image belonging to an annotation cannot be read.
    """
    annotation_directory_path = os.path.join(ROOT_PATH, ANNOTATION_FOLDER)
    image_directory_path = os.path.join(ROOT_PATH, IMAGE_FOLDER)

    # listdir() returns entries in arbitrary order; sorting makes the
    # index -> image assignment of the output reproducible between runs.
    names_and_xml_paths = []
    for filename in sorted(listdir(annotation_directory_path)):
        annotation_path = join(annotation_directory_path, filename)
        if isfile(annotation_path):
            names_and_xml_paths.append((os.path.splitext(filename)[0], annotation_path))

    data = {}

    for (name, annotation_path) in names_and_xml_paths:
        # Close the annotation file as soon as it has been parsed.
        with open(annotation_path, 'rb') as annotation_file:
            xml = xmltodict.parse(annotation_file)

        data[name] = {
            "image": name,
            "labels": extract_labels(xml),
            "bounding_boxes": extract_bounding_boxes(xml)
        }
        print("Processed %s" % name)

    rl_data = format_data(data)

    # Start from an empty image folder. makedirs() also covers the cases where
    # 'out_rl' already exists without 'imgs' or does not exist at all.
    if os.path.exists('out_rl/imgs'):
        shutil.rmtree('out_rl/imgs')
    os.makedirs('out_rl/imgs', exist_ok=True)

    for i, (image_name, _bounding_boxes, _labels) in enumerate(rl_data):
        image_path = ROOT_PATH+'/'+IMAGE_FOLDER+'/'+image_name+'.jpg'
        image = cv2.imread(image_path)
        if image is None:
            # imread() signals failure by returning None. Skipping the image
            # would shift the indices of the pickled lists, so fail loudly.
            raise OSError("Could not read image %s" % image_path)
        cv2.imwrite("out_rl/imgs/"+str(i)+".png", image)
        print(str(i))

    bounding_boxes = [bounding_boxes for (image, bounding_boxes, labels) in rl_data]
    with open("out_rl/"+"bounding_boxes.p", "wb") as bounding_boxes_file:
        pickle.dump(bounding_boxes, bounding_boxes_file, protocol=4)

    labels_rl = [labels for (image, bounding_boxes, labels) in rl_data]
    with open("out_rl/"+"labels_rl.p", "wb") as labels_file:
        pickle.dump(labels_rl, labels_file, protocol=4)
#%%
# Run the full extraction when this cell (or the whole script) is executed.
process_data()
#%%