dataprocessor.py

import numpy as np
import cv2


class BatchPreprocessor(object):

    def __init__(self, dataset_file_path, num_classes, output_size=[227, 227], horizontal_flip=False, shuffle=False,
                 mean_color=[104.0069879317889,116.66876761696767,122.6789143406786], multi_scale=None,istraining=True):
        self.num_classes = num_classes
        self.output_size = output_size
        self.horizontal_flip = horizontal_flip
        self.shuffle = shuffle
        self.mean_color = mean_color
        self.multi_scale = multi_scale
        self.istraining=istraining
        self.pointer = 0
        self.images = []
        self.labels = []
        # Read the dataset file
        dataset_file = open(dataset_file_path)
        lines = dataset_file.readlines()
        self.classpaths=[]
        for i in xrange(31):
            self.classpaths.append([])
        for line in lines:
            items = line.split()
            self.images.append(items[0])
            self.labels.append(int(items[1]))
        for j in xrange(len(self.labels)):
            label=self.labels[j]
            self.classpaths[label].append(j)

        # Shuffle the data
        if self.shuffle:
            self.shuffle_data()

    def shuffle_data(self):
        images = self.images[:]
        labels = self.labels[:]
        self.images = []
        self.labels = []

        idx = np.random.permutation(len(labels))
        for i in idx:
            self.images.append(images[i])
            self.labels.append(labels[i])

    def reset_pointer(self):
        self.pointer = 0
        if self.shuffle:
            self.shuffle_data()
    def class_next_batch(self,num_per_class):
        batch_size=31*num_per_class
        ids=[]
        for i in xrange(31):
            ids+=np.random.choice(self.classpaths[i],size=num_per_class,replace=False).tolist()
        selfimages=np.array(self.images)
        selflabels=np.array(self.labels)
        paths=selfimages[ids]
        labels=selflabels[ids]
        # Read images
        images = np.ndarray([num_per_class*31, self.output_size[0], self.output_size[1], 3])
        for i in range(len(paths)):
            img = cv2.imread(paths[i])
            # Flip image at random if flag is selected
            if self.horizontal_flip and np.random.random() < 0.5:
                img = cv2.flip(img, 1)
            if self.multi_scale is None:
                # Resize the image for output
                img = cv2.resize(img, (self.output_size[0], self.output_size[0]))
                img = img.astype(np.float32)
            elif isinstance(self.multi_scale, list):
                # Resize to random scale
                new_size = np.random.randint(self.multi_scale[0], self.multi_scale[1], 1)[0]
                img = cv2.resize(img, (new_size, new_size))
                img = img.astype(np.float32)
                if new_size!=self.output_size[0]:
                    if self.istraining:
                        # random crop at output size
                        diff_size = new_size - self.output_size[0]
                        random_offset_x = np.random.randint(0, diff_size, 1)[0]
                        random_offset_y = np.random.randint(0, diff_size, 1)[0]
                        img = img[random_offset_x:(random_offset_x+self.output_size[0]),
                                  random_offset_y:(random_offset_y+self.output_size[0])]
                    else:
                        y,x,_=img.shape
                        startx=x//2-self.output_size[0]//2
                        starty=y//2-self.output_size[1]//2
                        img=img[starty:starty+self.output_size[0],startx:startx+self.output_size[1]]
            # Subtract mean color
            img -= np.array(self.mean_color)

            images[i] = img
        # Expand labels to one hot encoding
        one_hot_labels = np.zeros((batch_size, self.num_classes))
        for i in range(len(labels)):
            one_hot_labels[i][labels[i]] = 1
        # Return array of images and labels
        return images, one_hot_labels

    def next_batch(self, batch_size):
        # Get next batch of image (path) and labels
        paths = self.images[self.pointer:(self.pointer+batch_size)]
        labels = self.labels[self.pointer:(self.pointer+batch_size)]

        # Update pointer
        self.pointer += batch_size

        # Read images
        images = np.ndarray([batch_size, self.output_size[0], self.output_size[1], 3])
        for i in range(len(paths)):
            img = cv2.imread(paths[i])
            # Flip image at random if flag is selected
            if self.horizontal_flip and np.random.random() < 0.5:
                img = cv2.flip(img, 1)

            if self.multi_scale is None:
                # Resize the image for output
                img = cv2.resize(img, (self.output_size[0], self.output_size[0]))
                img = img.astype(np.float32)
            elif isinstance(self.multi_scale, list):
                # Resize to random scale
                new_size = np.random.randint(self.multi_scale[0], self.multi_scale[1], 1)[0]
                img = cv2.resize(img, (new_size, new_size))
                img = img.astype(np.float32)
                if new_size!=self.output_size[0]:
                    if self.istraining:
                        # random crop at output size
                        diff_size = new_size - self.output_size[0]
                        random_offset_x = np.random.randint(0, diff_size, 1)[0]
                        random_offset_y = np.random.randint(0, diff_size, 1)[0]
                        img = img[random_offset_x:(random_offset_x+self.output_size[0]),
                                  random_offset_y:(random_offset_y+self.output_size[0])]
                    else:
                        y,x,_=img.shape
                        startx=x//2-self.output_size[0]//2
                        starty=y//2-self.output_size[1]//2
                        img=img[starty:starty+self.output_size[0],startx:startx+self.output_size[1]]
            # Subtract mean color
            img -= np.array(self.mean_color)

            images[i] = img

        # Expand labels to one hot encoding
        one_hot_labels = np.zeros((batch_size, self.num_classes))
        for i in range(len(labels)):
            one_hot_labels[i][labels[i]] = 1

        # Return array of images and labels
        return images, one_hot_labels