PreprocessingOfficeImages/split_to_five.py at master · iss4e/PreprocessingOfficeImages · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import os
from PIL import Image, ImageDraw
from collections import defaultdict
import sys
from shutil import copyfile
from tqdm import tqdm
import random

"""
Split the images in the input folder into 4 quadrants + center, preserving their label in a txt file.
Each split image has "&" and an index from 0 to 4 (depending on its spatial position) appended to its name.
The label for the image is found in the corresponding txt file.

To use: python split_to_five.py <input folder> <output folder path>

Note:
The current script keeps only 150 randomly chosen examples labelled with the vector 00010
(a person only in the bottom right quadrant) and drops the rest of them.
This is due to the nature of the data, and should be modified if necessary.

"""


def split_image(image_name, center_factor=104):
    """Crop one source image into four quadrants plus a center patch.

    The image is read from ``<image_folder_path>/<image_name>.jpg``, where
    ``image_folder_path`` is the module-level input folder.

    All crop coordinates are computed with floor division so that the pixel
    boxes are identical under Python 2 and Python 3 (true division would
    produce floats that Pillow rounds, shifting boxes for odd dimensions).

    Args:
        image_name: File name of the image, without the ``.jpg`` extension.
        center_factor: Number of pixels by which the center crop is shifted
            to the left of the horizontal middle of the image. Defaults to
            104, the value that used to be hard-coded here (presumably tuned
            to the framing of the dataset -- confirm before changing).

    Returns:
        A list of five PIL images in the order
        ``[top_left, top_right, bottom_left, bottom_right, center]``.
        Callers index this list by label position, so the order matters.
    """
    img_path = os.path.join(image_folder_path, image_name + '.jpg')
    img = Image.open(img_path)

    width, height = img.size

    half_width = width // 2
    half_height = height // 2

    # The bottom edge stops at height - 1; the original author's note says
    # this is needed because the width or height of the source is uneven.
    bottom_edge = height - 1

    top_left = img.crop((0, 0, half_width, half_height))
    top_right = img.crop((half_width, 0, width, half_height))
    bottom_left = img.crop((0, half_height, half_width, bottom_edge))
    bottom_right = img.crop((half_width, half_height, width, bottom_edge))

    # Middle half of the image in both directions, shifted left by
    # center_factor pixels; the lower edge is trimmed by one row like the
    # bottom quadrants.
    center = img.crop((
        width // 4 - center_factor,
        height // 4,
        3 * width // 4 - center_factor,
        3 * height // 4 - 1,
    ))

    # Order is important: position k of the label string describes entry k.
    return [top_left, top_right, bottom_left, bottom_right, center]


# Command-line arguments: <input folder> <output folder path>.
if len(sys.argv) < 3:
    sys.exit("usage: python split_to_five.py <input folder> <output folder path>")

image_folder_path = sys.argv[1]
output_path = sys.argv[2]

# Create the output folder up front so that saving the first crop cannot
# fail because the directory is missing.
if not os.path.isdir(output_path):
    os.makedirs(output_path)

listOfFiles = os.listdir(image_folder_path)
lenFiles = len(listOfFiles)

# Maps each 5-character label string to the base names (no extension) of the
# images that carry that label.
category_to_image = defaultdict(list)

for filename in listOfFiles:
    # splitext copes with names that have no dot or several dots, where
    # filename.split('.') would fail to unpack into two values.
    name, ext = os.path.splitext(filename)

    if ext != '.txt':
        continue

    label_path = os.path.join(image_folder_path, filename)
    with open(label_path, 'r') as f:
        # Strip surrounding whitespace so that a trailing newline does not
        # become part of the label.
        category = f.read().strip()

    # One character per split image (4 quadrants + center). Checked here so
    # a bad label file is reported before any output is written.
    if len(category) != 5:
        raise ValueError(
            "{}: expected a 5-character label, got {!r}".format(label_path, category))

    category_to_image[category].append(name)

# HACK: Drop some of the training examples which only contain a bottom right person
# This is due to the nature of the gathered data
# Only 150 randomly chosen images with this label are kept.

right_bottom_images = category_to_image["00010"]
random.shuffle(right_bottom_images)
category_to_image["00010"] = right_bottom_images[:150]

# items() works on both Python 2 and Python 3 (iteritems() is Python 2 only).
for category, image_list in category_to_image.items():

    for image in tqdm(image_list):
        split_images = split_image(image)

        # Character k of the label belongs to crop k returned by split_image.
        for position, binary_value in enumerate(category):

            split_name = "{}&{}".format(image, position)

            split_images[position].save(os.path.join(output_path, split_name + '.jpg'))

            txt_path = os.path.join(output_path, split_name + '.txt')

            # Each crop gets its own one-character label file.
            with open(txt_path, 'w') as txt_file:
                txt_file.write(binary_value)