examples/domain_adaptation/object_detection/prepare_cityscapes_to_voc.py

from pascal_voc_writer import Writer
import matplotlib.pyplot as plt
import numpy as np
import os
import json
import glob
import time
from shutil import move, copy
import tqdm

classes = {'bicycle': 'bicycle', 'bus': 'bus', 'car': 'car', 'motorcycle': 'motorcycle',
           'person': 'person', 'rider': 'rider', 'train': 'train', 'truck': 'truck'}
classes_keys = list(classes.keys())


def make_dir(path):
    if not os.path.isdir(path):
        os.makedirs(path)

#----------------------------------------------------------------------------------------------------------------
#convert polygon to bounding box
#code from:
#https://stackoverflow.com/questions/46335488/how-to-efficiently-find-the-bounding-box-of-a-collection-of-points
#----------------------------------------------------------------------------------------------------------------
def polygon_to_bbox(polygon):
    x_coordinates, y_coordinates = zip(*polygon)
    return [min(x_coordinates), min(y_coordinates), max(x_coordinates), max(y_coordinates)]


# --------------------------------------------
# read a json file and convert to voc format
# --------------------------------------------
def read_json(file):
    # if no relevant objects found in the image,
    # don't save the xml for the image
    relevant_file = False

    data = []
    with open(file, 'r') as f:
        file_data = json.load(f)

        for object in file_data['objects']:
            label, polygon = object['label'], object['polygon']

            # process only if label found in voc
            if label in classes_keys:
                polygon = np.array([x for x in polygon])
                bbox = polygon_to_bbox(polygon)
                data.append([classes[label]] + bbox)

        # if relevant objects found in image, set the flag to True
        if data:
            relevant_file = True

    return data, relevant_file


#---------------------------
#function to save xml file
#---------------------------
def save_xml(img_path, img_shape, data, save_path):
    writer = Writer(img_path,img_shape[1], img_shape[0])
    for element in data:
        writer.addObject(element[0],element[1],element[2],element[3],element[4])
    writer.save(save_path)


def prepare_cityscapes_to_voc(cityscapes_dir, save_path, suffix, image_dir):
    cityscapes_dir_gt = os.path.join(cityscapes_dir, 'gtFine')

    # ------------------------------------------
    # reading json files from each subdirectory
    # ------------------------------------------
    valid_files = []
    trainval_files = []
    test_files = []

    # make Annotations target directory if already doesn't exist
    ann_dir = os.path.join(save_path, 'Annotations')
    make_dir(ann_dir)

    start = time.time()
    for category in os.listdir(cityscapes_dir_gt):

        # # no GT for test data
        # if category == 'test':
        #     continue

        for city in tqdm.tqdm(os.listdir(os.path.join(cityscapes_dir_gt, category))):

            # read files
            files = glob.glob(os.path.join(cityscapes_dir, 'gtFine', category, city) + '/*.json')

            # process json files
            for file in files:
                data, relevant_file = read_json(file)

                if relevant_file:
                    base_filename = os.path.basename(file)[:-21]
                    xml_filepath = os.path.join(ann_dir, base_filename + '{}.xml'.format(suffix))
                    img_name = base_filename + '{}.png'.format(suffix)
                    img_path = os.path.join(cityscapes_dir, image_dir, category, city,
                                            base_filename + '{}.png'.format(suffix))
                    img_shape = plt.imread(img_path).shape
                    valid_files.append([img_path, img_name])

                    # make list of trainval and test files for voc format
                    # lists will be stored in txt files
                    trainval_files.append(img_name[:-4]) if category == 'train' else test_files.append(img_name[:-4])

                    # save xml file
                    save_xml(os.path.join(image_dir, category, city,
                                            base_filename + '{}.png'.format(suffix)), img_shape, data, xml_filepath)

    end = time.time() - start
    print('Total Time taken: ', end)

    # ----------------------------
    # copy files into target path
    # ----------------------------
    images_savepath = os.path.join(save_path, 'JPEGImages')
    make_dir(images_savepath)

    start = time.time()
    for file in valid_files:
        copy(file[0], os.path.join(images_savepath, file[1]))

    print('Total Time taken: ', end)

    # ---------------------------------------------
    # create text files of trainval and test files
    # ---------------------------------------------
    textfiles_savepath = os.path.join(save_path, 'ImageSets', 'Main')
    make_dir(textfiles_savepath)

    traival_files_wr = [x + '\n' for x in trainval_files]
    test_files_wr = [x + '\n' for x in test_files]

    with open(os.path.join(textfiles_savepath, 'trainval.txt'), 'w') as f:
        f.writelines(traival_files_wr)

    with open(os.path.join(textfiles_savepath, 'test.txt'), 'w') as f:
        f.writelines(test_files_wr)


if __name__ == '__main__':
    cityscapes_dir = 'datasets/cityscapes/'
    if not os.path.exists(cityscapes_dir):
        print("Please put cityscapes datasets in: {}".format(cityscapes_dir))
        exit(0)
    save_path = 'datasets/cityscapes_in_voc/'
    suffix = "_leftImg8bit"
    image_dir = "leftImg8bit"
    prepare_cityscapes_to_voc(cityscapes_dir, save_path, suffix, image_dir)

    save_path = 'datasets/foggy_cityscapes_in_voc/'
    suffix = "_leftImg8bit_foggy_beta_0.02"
    image_dir = "leftImg8bit_foggy"
    prepare_cityscapes_to_voc(cityscapes_dir, save_path, suffix, image_dir)