Fully-Convolutional-Networks/batch_datset_reader.py at master · qhan1028/Fully-Convolutional-Networks · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
"""
Code ideas from https://github.com/Newmu/dcgan and tensorflow mnist dataset reader
"""
import numpy as np
import scipy.misc as misc
import os.path as osp
import cv2

class BatchDatset:
    files = []
    images = []
    annotations = []
    image_options = {}
    batch_offset = 0
    epochs_completed = 0

    def __init__(self, records_list, image_options={}, mode='train'):
        """
        Initialize a generic file reader with batching for list of files
        :param records_list: list of file records to read -
        sample record: {'image': f, 'annotation': annotation_file, 'filename': filename}
        :param image_options: A dictionary of options for modifying the output image
        Available options:
        resize = True / False
        resize_size = # size of output image - does bilinear resize
        color=True / False
        """
        print("> [BDR] Initializing Batch Dataset Reader...")
        print('> [BDR] Image options:', image_options)
        self.files = records_list
        self.image_options = image_options
        self.npz_file = 'Data_zoo/' + mode + '_data.npz'
        self._read_images(mode)

    def _read_images(self, mode):
        if osp.exists(self.npz_file):
            print('> [BDR] Found ' + mode + ' npz file!')
            data = np.load(self.npz_file)
            self.images = data['images']
            self.annotations = data['annotations']
        else:
            self.__channels = True
            self.images = np.array( [self._transform(filename['image']) for filename in self.files])
            self.__channels = False
            self.annotations = np.array( [np.expand_dims(self._transform(filename['annotation']), axis=3) for filename in self.files])
            np.savez(self.npz_file, images=self.images, annotations=self.annotations)

        print('> [BDR] Images shape:', self.images.shape)
        print('> [BDR] Annotations shape:', self.annotations.shape)

    def _transform(self, filename):
        image = cv2.imread(filename)
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        if self.__channels and len(image.shape) < 3:  # make sure images are of shape(h,w,3)
            image = np.array([image for i in range(3)])

        if self.image_options.get("resize", False) and self.image_options["resize"]:
            resize_height = int(self.image_options["resize_height"])
            resize_width = int(self.image_options["resize_width"])
            #resize_image = misc.imresize(image, [resize_height, resize_width], interp='nearest')
            resize_image = cv2.resize(image, (resize_width, resize_height), interpolation=cv2.INTER_CUBIC)

        else:
            resize_image = image

        return np.array(resize_image)

    def get_records(self):
        return self.images, self.annotations

    def reset_batch_offset(self, offset=0):
        self.batch_offset = offset

    def next_batch(self, batch_size):
        start = self.batch_offset
        self.batch_offset += batch_size
        if self.batch_offset > self.images.shape[0]:
            # Finished epoch
            self.epochs_completed += 1
            print("****************** Epochs completed: " + str(self.epochs_completed) + "******************")
            # Shuffle the data
            perm = np.arange(self.images.shape[0])
            np.random.shuffle(perm)
            self.images = self.images[perm]
            self.annotations = self.annotations[perm]
            # Start next epoch
            start = 0
            self.batch_offset = batch_size

        end = self.batch_offset
        return self.images[start:end], self.annotations[start:end]

    def get_random_batch(self, batch_size):
        indexes = np.random.randint(0, self.images.shape[0], size=[batch_size]).tolist()
        return self.images[indexes], self.annotations[indexes]