polytab/DataGenerator.py at main · vanajmoorthy/polytab · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
# This code was adapted from the TabCNN project
# https://github.com/andywiggins/tab-cnn/blob/master/model/DataGenerator.py

import numpy as np
import keras
from keras.utils import Sequence


class DataGenerator(Sequence):
    # Keras Sequence that serves batches of fixed-width context windows cut from per-file
    # ".npz" archives, together with the label of the frame each window is anchored on.
    #
    # Every ID has the form "<file stem>_<frame index>": the stem names the archive
    # "<data_path>/<file stem>.npz" and the index selects a frame inside it. Each archive
    # must provide a "repr" array (frames along axis 0) and a "labels" array indexed by frame.

    # Sets up the generator.
    #   list_IDs:     sequence of sample IDs ("<file stem>_<frame index>").
    #   data_path:    directory holding the ".npz" archives.
    #   batch_size:   number of samples per batch.
    #   shuffle:      if truthy, the sample order is re-shuffled at the end of every epoch.
    #   label_dim:    shape of one label, used to build y_dim.
    #   con_win_size: number of consecutive frames in one input window.
    # X_dim and y_dim are derived attributes describing the shape of a full batch. The 192
    # in X_dim is the number of values per frame that "repr" must have (presumably the
    # number of CQT bins -- confirm against the preprocessing code).
    def __init__(self, list_IDs, data_path="./cqt/", batch_size=128, shuffle=True, label_dim=(6, 21), con_win_size=9):
        # Keras 3 expects the base-class initialiser to run; on older versions it is a no-op.
        super().__init__()
        self.list_IDs = list_IDs
        self.data_path = data_path
        self.batch_size = batch_size
        self.shuffle = shuffle
        self.label_dim = label_dim
        self.con_win_size = con_win_size
        # Frames of zero padding added before and after the recording so that a window can
        # be cut for every frame index, including the first and last ones.
        self.halfwin = con_win_size // 2
        self.X_dim = (self.batch_size, 192, self.con_win_size, 1)
        self.y_dim = (self.batch_size, self.label_dim[0], self.label_dim[1])
        # Build the initial (optionally shuffled) sample order.
        self.on_epoch_end()

    # Returns the number of full batches per epoch. IDs left over after the last full
    # batch are not served during that epoch.
    def __len__(self):
        return len(self.list_IDs) // self.batch_size

    # Retrieves the batch at position `index` as a tuple (X, y) of inputs and labels.
    def __getitem__(self, index):
        start = index * self.batch_size
        batch_indexes = self.indexes[start:start + self.batch_size]
        batch_IDs = [self.list_IDs[k] for k in batch_indexes]
        return self.__data_generation(batch_IDs)

    # Resets the sample order and, if shuffling is enabled, shuffles it so that the model
    # does not see the data in the same order after each epoch.
    def on_epoch_end(self):
        self.indexes = np.arange(len(self.list_IDs))
        if self.shuffle:
            np.random.shuffle(self.indexes)

    # Builds one batch from the given IDs. For each ID the matching archive is loaded, its
    # "repr" array is zero-padded by `halfwin` frames on both ends of the frame axis, and
    # `con_win_size` consecutive frames starting at the frame index (in padded coordinates)
    # are cut out. The window is transposed so frames become the second axis and a trailing
    # channel axis of size 1 is appended. The label is the "labels" row at the frame index.
    # Returns (X, y) with one row per ID.
    def __data_generation(self, list_IDs_temp):
        # Size the buffers by the number of IDs actually supplied so that a short list
        # never yields uninitialised rows.
        n_samples = len(list_IDs_temp)
        X = np.empty((n_samples,) + tuple(self.X_dim[1:]))
        y = np.empty((n_samples,) + tuple(self.y_dim[1:]))

        data_dir = self.data_path + "/"
        pad_width = [(self.halfwin, self.halfwin), (0, 0)]

        for i, ID in enumerate(list_IDs_temp):
            # Split on the last underscore only: the file stem may itself contain "_".
            stem, _, frame = ID.rpartition("_")
            frame_idx = int(frame)

            # The archive keeps a file handle open until closed, so release it as soon as
            # the two arrays have been read into memory.
            with np.load(data_dir + stem + ".npz") as loaded:
                full_x = np.pad(loaded["repr"], pad_width, mode='constant')
                label = loaded["labels"][frame_idx]

            sample_x = full_x[frame_idx: frame_idx + self.con_win_size]
            X[i,] = np.expand_dims(np.swapaxes(sample_x, 0, 1), -1)
            y[i,] = label

        return X, y