# ZeroShotLearning/main.py at main · sebastko/ZeroShotLearning · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
import torch
import torch.nn as nn
import torch.autograd as autograd
import numpy as np
import copy
from tqdm import tqdm, trange

import dataset
from gan import GanTrainer
from classifier import MaskedClassifier, train_cls


def get_dataset_and_print(data, type, device):
    """Load one split via ``data.get_dataset`` and print a short summary of it.

    Args:
        data: Object exposing ``get_dataset(type, device)`` that returns four
            values (features, labels, classes, mask).
        type: Split identifier forwarded unchanged to ``data.get_dataset``
            and echoed in the summary header.
        device: Forwarded unchanged to ``data.get_dataset``.

    Returns:
        The tuple ``(X, y, classes, mask)`` obtained from ``data.get_dataset``.
    """
    features, labels, class_ids, class_mask = data.get_dataset(type, device)

    # The features must expose ``.shape`` and the classes must support ``len()``.
    summary_lines = (
        '---------------',
        f'Data set {type}:',
        f'  N:          {features.shape[0]}',
        f'  classes:    {class_ids}',
        f'  num of cls: {len(class_ids)}',
        f'  mask:       {class_mask}',
    )
    for line in summary_lines:
        print(line)

    return features, labels, class_ids, class_mask

def cli(data_features_dir='/mnt/c/datasets/xlsa17/data/AWA2', seen_val_ratio=0.2, n_epochs=10):
    """Run the full zero-shot learning pipeline end to end.

    Steps, in order:
      1. Train a classifier on the real features of the seen classes.
      2. Train the conditional GAN, conditioned on class attributes.
      3. Generate synthetic features for the unseen (validation) classes.
      4. Train the final ZSL and GZSL classifiers.

    Args:
        data_features_dir: Directory passed to ``dataset.ParentDataset``.
        seen_val_ratio: Fraction of the 'train' split (its trailing rows) held
            out as seen-class validation data. Must lie strictly in (0, 1).
        n_epochs: Number of ``gan_trainer.fit_GAN`` calls. Must be >= 0.

    Raises:
        ValueError: If ``seen_val_ratio`` or ``n_epochs`` is out of range.
    """
    # Validate up front so a bad setting fails before any data is loaded.
    if not 0 < seen_val_ratio < 1:
        raise ValueError(f'seen_val_ratio must be in (0, 1), got {seen_val_ratio!r}')
    if n_epochs < 0:
        raise ValueError(f'n_epochs must be >= 0, got {n_epochs!r}')

    device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
    print(f'Device: {device}')

    data = dataset.ParentDataset(data_features_dir)

    total_N, _ = data.features.shape
    train_all_X, train_all_y, _, train_all_mask = get_dataset_and_print(data, 'train', device)
    _, fea_dim = train_all_X.shape

    # Leading rows become the training set, trailing rows the seen-class
    # validation set; both share the mask of the full 'train' split.
    # NOTE(review): no shuffling happens here -- confirm that get_dataset
    # returns rows in an order that makes this split representative.
    train_N = int(train_all_X.shape[0] * (1 - seen_val_ratio))
    train_X, train_y, train_mask = train_all_X[:train_N, :], train_all_y[:train_N], train_all_mask
    val_seen_X, val_seen_y = train_all_X[train_N:, :], train_all_y[train_N:]

    val_unseen_X, val_unseen_y, val_unseen_classes, val_unseen_mask = get_dataset_and_print(data, 'val', device)
    # The test splits are only loaded for their printed summary and the
    # sample-count sanity check below.
    test_seen_X, _, _, _ = get_dataset_and_print(data, 'test_seen', device)
    test_unseen_X, _, _, _ = get_dataset_and_print(data, 'test_unseen', device)

    # Sanity check: the four splits together must account for every sample.
    assert total_N == train_all_X.shape[0] + val_unseen_X.shape[0] + test_seen_X.shape[0] + test_unseen_X.shape[0]

    # 1. Train a linear softmax classifier P(y|x;θ) on the real features of seen classes.
    print('1. Train a linear softmax classifier P(y|x;θ) on the real features of seen classes.')
    best_linear_cls = train_cls(train_mask, train_X, train_y, val_seen_X, val_seen_y, device)

    # 2. Train  the  conditional f-CLSWGAN generator, conditioned on class attributes a_y
    print('2. Train  the  conditional f-CLSWGAN generator, conditioned on class attributes a_y')

    attr_dim = data.attributes.shape[-1]
    # One attribute row per training sample, looked up by label.
    # NOTE(review): this tensor is built on the CPU while train_X was loaded
    # for `device` -- presumably GanTrainer moves it; confirm.
    train_attr = torch.FloatTensor(data.attributes[train_y.cpu().detach().numpy()])
    assert train_attr.shape == (train_X.shape[0], attr_dim)
    gan_trainer = GanTrainer(device, fea_dim, attr_dim, attr_dim, classifier=best_linear_cls)

    for ep in trange(1, n_epochs + 1):
        loss_dis, loss_gen, d_x, d_g_z = gan_trainer.fit_GAN(train_X, train_attr, train_y)
        print("Loss for epoch: %3d - D: %.4f | G: %.4f | D(x) acc: %.4f | D(G(z)) acc: %.4f"
              % (ep, loss_dis, loss_gen, d_x, d_g_z))

    print('Done!')

    # 3. Augment the training set by generating synthetic examples of unseen classes using generator G.
    print('3. Augment the training set by generating synthetic examples of unseen classes using generator G.')

    # Size the synthetic set so that, in total, it roughly matches the number
    # of real training samples.
    n_examples_per_class = train_X.shape[0] // len(val_unseen_classes)
    synth_X, synth_y = gan_trainer.generate_data(val_unseen_classes, data.attributes, n_examples=n_examples_per_class)

    assert train_X.shape[-1] == synth_X.shape[-1]
    assert len(synth_y.shape) == 1
    assert synth_X.shape[0] == synth_y.shape[0]

    # 4. Train the final classifier.
    print('4. Train the final classifier.')

    # ZSL: train on synthetic unseen-class features only, validate on real
    # unseen-class features. The returned classifier is not used further.
    print('==================')
    print(' ZSL:')
    print('------------------')
    train_cls(val_unseen_mask, synth_X, synth_y, val_unseen_X, val_unseen_y, device)

    # GZSL: train on real seen + synthetic unseen features, validate on both.
    # The returned classifier is not used further.
    print('==================')
    print(' GZSL:')
    print('------------------')
    train_val_mask = train_mask + val_unseen_mask
    gzsl_train_X = torch.cat((train_X, synth_X), dim=0)
    gzsl_train_y = torch.cat((train_y, synth_y), dim=0)
    val_X = torch.cat((val_seen_X, val_unseen_X), dim=0)
    val_y = torch.cat((val_seen_y, val_unseen_y), dim=0)
    train_cls(train_val_mask, gzsl_train_X, gzsl_train_y, val_X, val_y, device)


# Run the pipeline only when this file is executed as a script, not when it is imported.
if __name__ == "__main__":
    cli()