# neuralnet_multitask.py
from __future__ import absolute_import
from __future__ import print_function
import matplotlib.pyplot as plt
import autograd.numpy as np
import autograd.numpy.random as npr
import autograd.scipy.stats.norm as norm
from autograd import grad
from optimizers import adam
import ascdata
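# `optimizers` and `ascdata` are project-local modules, not PyPI packages.
# `adam` is assumed to follow autograd's reference optimizer signature,
# adam(grad, init_params, callback=None, num_iters=..., step_size=...), and
# `ascdata` to expose the get_asc_data() / get_bp_data() loaders used below.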
def make_nn_funs(layer_sizes, weight_scale=10.0, noise_scale=0.1, nonlinearity=np.tanh):
    """These functions implement a standard multi-layer perceptron."""
    # Materialize the layer shapes so they can be iterated more than once.
    shapes = list(zip(layer_sizes[:-1], layer_sizes[1:]))
    num_weights = sum((m + 1) * n for m, n in shapes)

    def unpack_layers(weights):
        # Slice the flat parameter vector into per-layer (weights, biases) pairs.
        for m, n in shapes:
            cur_layer_weights = weights[:m * n].reshape((m, n))
            cur_layer_biases = weights[m * n:m * n + n].reshape((1, n))
            yield cur_layer_weights, cur_layer_biases
            weights = weights[(m + 1) * n:]

    def predictions(weights, inputs):
        # Forward pass; returns the final layer's pre-activation outputs.
        for W, b in unpack_layers(weights):
            outputs = np.dot(inputs, W) + b
            inputs = nonlinearity(outputs)
        return outputs

    def logprob(weights, inputs, targets):
        # Unnormalized log-posterior: Gaussian prior over the weights plus a
        # Gaussian likelihood of the targets given the network's predictions.
        log_prior = np.sum(norm.logpdf(weights, 0, weight_scale))
        preds = predictions(weights, inputs)
        log_lik = np.sum(norm.logpdf(preds, targets, noise_scale))
        return log_prior + log_lik

    return num_weights, predictions, logprob
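# Worked example of the parameter count (illustrative sizes only, not the
# network used below): for layer_sizes=[2, 3, 1] the flat weight vector holds
# (2+1)*3 + (3+1)*1 = 13 entries, so
#     num_weights, _, _ = make_nn_funs([2, 3, 1])
# gives num_weights == 13, and predictions() then expects inputs of shape
# (n_examples, 2).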
def build_toy_dataset(n_data=80, noise_std=0.1, D=1):
    rs = npr.RandomState(0)
    # linspace's num must be an integer, so use floor division.
    inputs = np.concatenate([np.linspace(0, 3, num=n_data // 2),
                             np.linspace(6, 8, num=n_data // 2)])
    targets = np.cos(inputs) + rs.randn(n_data) * noise_std
    inputs = (inputs - 4.0) / 2.0
    inputs = inputs.reshape((len(inputs), D))
    targets = targets.reshape((len(targets), D)) / 2.0
    return inputs, targets
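# build_toy_dataset is unused by default (the main block loads real data via
# ascdata); it returns (80, 1) inputs and targets sampled from a noisy cosine
# over two disjoint input segments, handy for smoke-testing the network.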
if __name__ == '__main__':
    # Specify the inference problem by its unnormalized log-posterior.
    rbf = lambda x: np.exp(-x**2)
    relu = lambda x: np.maximum(x, 0.0)

    # Build a 3-hidden-layer neural network (34 inputs, one output).
    num_weights, predictions, logprob = \
        make_nn_funs(layer_sizes=[34, 100, 100, 100, 1], nonlinearity=rbf)

    # inputs, targets = build_toy_dataset()
    inputs, targets = ascdata.get_asc_data()

    objective = lambda weights, t: -logprob(weights, inputs, targets)

    def plot_initial_data(inX, iny, ax):
        plot_inputs = inX.T[2]
        ax.plot(plot_inputs, iny.ravel(), 'bx')

    X_bp1, y_bp1 = ascdata.get_bp_data(1, 4194659, inputs, targets)
    X_bp2, y_bp2 = ascdata.get_bp_data(3, 4194873, inputs, targets)

    # Set up figure.
    fig = plt.figure(1, facecolor='white')
    ax1 = fig.add_subplot(211, frameon=False)
    ax2 = fig.add_subplot(212, frameon=False)
    plot_initial_data(X_bp1, y_bp1, ax1)
    plot_initial_data(X_bp2, y_bp2, ax2)
    plt.show(block=False)

    def plot_prediction_data(inX, iny, params, ax, subplot_no):
        # Redraw one subplot with the data and the current network predictions.
        ax.cla()
        plot_inputs = inX.T[2]
        ax.plot(plot_inputs, iny.ravel(), 'bx')
        outputs = predictions(params, inX)
        ax.plot(plot_inputs, outputs)

    LLHs = []
    LLH_xs = []

    def callback(params, t, g):
        # LLH is the unnormalized log-posterior (log prior + log likelihood).
        LLH = -objective(params, t)
        LLH_xs.append(t)
        print("Iteration {} log likelihood {}".format(t, LLH))
        LLHs.append(LLH)
        plot_prediction_data(X_bp1, y_bp1, params, ax1, 211)
        plot_prediction_data(X_bp2, y_bp2, params, ax2, 212)
        plt.draw()
        # plt.pause(1.0/60.0)

    rs = npr.RandomState(0)
    init_params = 10 * rs.randn(num_weights)

    print("Optimizing network parameters...")
    optimized_params = adam(grad(objective), init_params,
                            step_size=0.5, num_iters=100, callback=callback)

    plt.figure(2, facecolor='white')
    plt.plot(LLH_xs, LLHs)
    plt.show()
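# Minimizing `objective` (the negative unnormalized log-posterior) with Adam
# amounts to MAP estimation of the network weights; figure 2 plots that
# log-posterior against the iteration count recorded by the callback.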