darknet/scripts/get_openimages_dataset.py

import csv
import os

#select classes you want to download at https://github.com/openimages/dataset/blob/master/dict.csv
CLASS_LIST = ('/m/01g317','/m/04yx4')
img_name = "111111111111"

#download csv from https://storage.googleapis.com/openimages/web/download.html
with open('path\\train-annotations-bbox.csv', newline='') as csvfile:
    bboxs = csv.reader(csvfile, delimiter=',', quotechar='|')
    for bbox in bboxs:
        if bbox[2] in CLASS_LIST:
            if img_name != bbox[0]:
                if not os.path.isfile("destination_path\\%s.jpg"%bbox[0]):
                    os.system("gsutil cp gs://open-images-dataset/train/%s.jpg destination_path"%bbox[0])
                    out_file = open("destination_path\\%s.txt"%bbox[0], 'w')
                    img_name = bbox[0]
            if img_name == bbox[0]:
                out_file.write(str(CLASS_LIST.index(bbox[2])) + " " + str(float(bbox[4])+(float(bbox[5])-float(bbox[4]))/2) + " " + str(float(bbox[6])+(float(bbox[7])-float(bbox[6]))/2)+ " " + str(float(bbox[5])-float(bbox[4])) + " " + str(float(bbox[7])-float(bbox[6])) + '\n')
Create get_openimages_dataset.py Script that downloads images with selected classes from OpenImages dataset and create labels in "yolo format" 2018-05-17 21:22:49 +08:00			`import csv`
			`import os`

			`#select classes you want to download at https://github.com/openimages/dataset/blob/master/dict.csv`
			`CLASS_LIST = ('/m/01g317','/m/04yx4')`
			`img_name = "111111111111"`

			`#download csv from https://storage.googleapis.com/openimages/web/download.html`
			`with open('path\\train-annotations-bbox.csv', newline='') as csvfile:`
			`bboxs = csv.reader(csvfile, delimiter=',', quotechar='\|')`
			`for bbox in bboxs:`
			`if bbox[2] in CLASS_LIST:`
			`if img_name != bbox[0]:`
			`if not os.path.isfile("destination_path\\%s.jpg"%bbox[0]):`
			`os.system("gsutil cp gs://open-images-dataset/train/%s.jpg destination_path"%bbox[0])`
			`out_file = open("destination_path\\%s.txt"%bbox[0], 'w')`
			`img_name = bbox[0]`
			`if img_name == bbox[0]:`
			`out_file.write(str(CLASS_LIST.index(bbox[2])) + " " + str(float(bbox[4])+(float(bbox[5])-float(bbox[4]))/2) + " " + str(float(bbox[6])+(float(bbox[7])-float(bbox[6]))/2)+ " " + str(float(bbox[5])-float(bbox[4])) + " " + str(float(bbox[7])-float(bbox[6])) + '\n')`