In [ ]:
%pylab inline
Populating the interactive namespace from numpy and matplotlib
In [ ]:
import numpy as np
import matplotlib.pyplot as plt

Week 8 section¶

In this notebook, we cover:

  1. Hopfield networks, which we didn't get to discuss much in class. This is one option for implementing the w08 homework.

  2. The other option is to build a feedforward one-neuron network to distinguish between two classes of letters. We go over this as well.

1) Hopfield networks¶

For this week's homework, one option is to implement a Hopfield network that can hopefully distinguish letters.

Data¶

In [ ]:
letters_url = ["http://mcb111.org/w08/abc.A.cat","http://mcb111.org/w08/abc.B.cat",
               "http://mcb111.org/w08/abc.C.cat","http://mcb111.org/w08/abc.D.cat",
               "http://mcb111.org/w08/abc.E.cat","http://mcb111.org/w08/abc.X.cat",
               "http://mcb111.org/w08/abc.Z.cat"]

handwritten_letters_url = ["http://mcb111.org/w08/abc.pmin0.3.pmax0.5.A.dat","http://mcb111.org/w08/abc.pmin0.3.pmax0.5.B.dat",
                           "http://mcb111.org/w08/abc.pmin0.3.pmax0.5.C.dat","http://mcb111.org/w08/abc.pmin0.3.pmax0.5.D.dat",
                           "http://mcb111.org/w08/abc.pmin0.3.pmax0.5.E.dat","http://mcb111.org/w08/abc.pmin0.3.pmax0.5.X.dat",
                           "http://mcb111.org/w08/abc.pmin0.3.pmax0.5.Z.dat"]

In a similar fashion to what we've done in previous weeks, we are going to define a function that can read these letters from the URL. We know that these letters are going to be 5x5 grids populated with certain characters, and we might have more than one example of the letter at each URL:

In [ ]:
def load_letter(url):
    '''
    This function helps us load the data for the hand-written letters.
    input:  url with data.
    output: array with each letter in a 5x5 array format.

    1st line uses np.loadtxt to load the data line by line into an array
    2nd line splits each line into 1 item per pixel
    3rd line turns dots into -1's and all other characters into 1's (see the documentation of np.where to learn more!)
    4th line reshapes the array into a stack of 5 by 5 images of the handwritten data
    '''
    dat = np.loadtxt(url, dtype='str')
    dat = np.array([list(row) for row in dat])
    dat = np.where(dat == '.', -1, 1)
    dat = dat.reshape(len(dat.flatten()) // (5 * 5), 5, 5)
    return dat

Let's test it and see how we can visualize these letters:

In [ ]:
reference_A = load_letter(letters_url[0])
reference_A.shape
Out[ ]:
(10, 5, 5)

There seem to be 10 examples of letter A in this data:

In [ ]:
fig, axs = plt.subplots(ncols=reference_A.shape[0], nrows=1, sharex=True)
fig.set_figwidth(35)
fig.set_figheight(5)

axs = axs.flatten()

for idx, axis in enumerate(axs):

    axis.imshow(reference_A[idx])
    axis.set_title("example {}".format(idx))
[Figure: the 10 reference examples of the letter A]

What about the handwritten examples of the letter A?

In [ ]:
hand_A = load_letter(handwritten_letters_url[0])
hand_A.shape
Out[ ]:
(2000, 5, 5)

There seem to be 2000 examples of the handwritten character A; let's only look at a few of them:

In [ ]:
fig, axs = plt.subplots(ncols=5, nrows=3, sharex=True)
fig.set_figwidth(10)
fig.set_figheight(5)

axs = axs.flatten()

for idx, axis in enumerate(axs):

    axis.imshow(hand_A[idx])
    # axis.set_xticks([])
    # axis.set_yticks([])
[Figure: 15 of the handwritten examples of the letter A]

The handwritten letters aren't perfect like the references, but we will implement the Hopfield network and see how many of them can be recognized as A's.

How do we implement the Hopfield network?

From MacKay's book:

In this chapter we will discuss a fully connected feedback network called the Hopfield network. The weights in the Hopfield network are constrained to be symmetric, i.e., the weight from neuron i to neuron j is equal to the weight from neuron j to neuron i.

Hopfield networks have two applications. First, they can act as associative memories.

It then goes on to describe Hebbian learning in a very intuitive way. If you are struggling to understand what's going on conceptually, I recommend reading MacKay's section 42.1.

However, let's break down a couple of things that you are going to want to be able to do in order to implement the weight matrix.

The weight matrix¶

Hopfield networks are composed of fully connected neurons: every neuron is connected to every other neuron, and vice versa. These connections describe the flow of information through the network using weights. Because the connections are bidirectional, the weight matrix positions (1,2) and (2,1), which hold the weights for the connection between neurons 1 and 2, have the same value. In other words:

$$w_{n,m} = w_{m,n}$$

And the neurons do not have self-connections: the weight for a connection between a neuron and itself is zero. In other words:

$$w_{n,n} = 0 $$

This already gives us a pretty good idea of what such a weight matrix has to look like: zeros on the main diagonal and symmetric along that axis.

Now we want to encode our 5 by 5 image into a format that the network we are building can take as input. We can achieve this by linearizing the array in which we are storing the information using the .flatten() method, for example:

In [ ]:
plt.imshow(reference_A[0])
Out[ ]:
<matplotlib.image.AxesImage at 0x785336f5fc70>
[Figure: the first reference A displayed with imshow]
In [ ]:
reference_A[0].flatten()
Out[ ]:
array([-1, -1,  1, -1, -1, -1,  1, -1,  1, -1, -1,  1,  1,  1, -1, -1,  1,
       -1,  1, -1,  1, -1, -1, -1,  1])

Notice that this is just a one-dimensional representation of the same image: we simply take the first row, then append the second, and so on.
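To see this concretely, compare the first row of the image with the first five entries of the flattened vector (a quick check, nothing more):

In [ ]:
# the flattened vector is just the rows laid end to end
print(reference_A[0][0])               # first row of the 5x5 image
print(reference_A[0].flatten()[:5])    # first 5 entries of the flattened vector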

Given a 25-dimensional input vector $y$, and the 25$\times$25 dimensional weight matrix $w$, then the activation $a$ of the $n$th neuron, $a_n$, is

$$\begin{aligned} a_n &= \sum_{m=1}^{25} w_{nm} y_m \\ &= w_{n,1} y_1 + w_{n,2} y_2 + \dots + w_{n,25} y_{25} \end{aligned}$$
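In NumPy, this sum over $m$ for every neuron $n$ at once is just a matrix-vector product. Here is a tiny toy example with 3 neurons (the numbers are made up purely for illustration):

In [ ]:
# toy 3-neuron example of a_n = sum_m w_nm y_m
w_toy = np.array([[ 0,  1, -1],
                  [ 1,  0,  1],
                  [-1,  1,  0]])
y_toy = np.array([1, -1, 1])

a_toy = w_toy @ y_toy   # same as [np.sum(w_toy[n] * y_toy) for n in range(3)]
print(a_toy)            # [-2  2 -2]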

Let's say we trained our connectivity matrix by storing a perfect A. As seen in the lecture notes, the first row of $w$ is

0 1 -1 1 1 1 -1 1 -1 1 1 -1 -1 -1 1 1 -1 1 -1 1 -1 1 1 1 -1

Now let's say we provide as input to the network a perfect A -- we better get a perfect A as the output of the network!

Let's just focus on the first row of our 5$\times$5 digit representation. Our perfect A input is $y = [-1, -1, +1, -1, -1, \dots ]$.

To get a perfect A output, we need basically this same vector: the first pixel needs to be off, as does the second; the third pixel needs to be on; and pixels 4 and 5 need to be off.

Let's look at the output of the network when providing the above $y$ as input.

$$\begin{aligned} a_1 &= w_{1,1} y_1 + w_{1,2} y_2 + \dots + w_{1,25} y_{25} \\ &= 0(-1) +1(-1) -1(+1) +1(-1) +1(-1) + \dots \\ &= -24 \end{aligned}$$

Ignoring the first position (because neuron 1 can't talk to itself), every single time that $y$ has a $+1$ in an entry, the corresponding connectivity-matrix entry is a $-1$, and vice versa, so every term in the sum contributes $-1$. This makes sense -- if we want a perfect A as output, we need the first pixel to be off. By storing the perfect A in the network, we've encoded the information that when the first pixel is off, so are the second pixel and pixels 4 and 5, while pixel 3 is on. The result of the above operation is a very negative number -- that is the activation $a_1$. We get an activity $y_n$ from an activation $a_n$ via

$$y(a) = \left\{\begin{matrix} +1 & a \geq 0\\ -1 & a < 0\\ \end{matrix} \right.$$

This is where np.where() might come in handy: it scans an array for a condition, for example entries being greater than or equal to 0, and replaces their values with 1 or -1 accordingly. We already used this function above in the load_letter function.
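For example, applied to a handful of made-up activations:

In [ ]:
# threshold rule y(a): +1 if a >= 0, -1 otherwise, applied elementwise
a_example = np.array([-24, 3, 0, -1])      # made-up activations, for illustration
print(np.where(a_example >= 0, 1, -1))     # [-1  1  1 -1]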

So by this rule, $y_1 = y(a_1) = y(-24) = -1$.

Now, what if we passed in a slightly corrupted version of an A? Again let's just restrict ourselves to the top row of the image. Say that we had the second pixel on, when ideally it should be off: $y_{corrupt} = [-1, +1, +1, -1, -1, \dots ]$.

$$\begin{aligned} a_1 &= w_{1,1} y_{corrupt, 1} + w_{1,2} y_{corrupt, 2} + \dots + w_{1,25} y_{corrupt, 25} \\ &= 0(-1) +1(+1) -1(+1) +1(-1) +1(-1) + \dots \\ &= -22 \end{aligned}$$

A-ha: we have a single mismatch at the second index, contributing a $+1$ to our summation. But there are so many matches at all the other pixels that the activation is still very negative, so the activity $y_1$ after passing in the imperfect A is still $-1$ and the pixel is off.

This is the fundamental property of the Hopfield network -- by storing patterns and the pairwise interactions between pixels, then imperfect versions of the patterns that get passed in to the network can get "corrected" by all the stored pairwise information between pixels -- you just need enough pixels to be on when they should be on, and off when they should be off, to fix imperfect patterns.
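Here is a minimal sketch of that idea in code: store only the perfect A with Hebb's rule (the construction is spelled out in the next section; np.outer is equivalent to the matrix product used there), then pass in an A with one flipped pixel and see it corrected:

In [ ]:
# store the perfect A, then recall from a corrupted copy
stored = reference_A[0].flatten()
w_sketch = np.outer(stored, stored).astype(float)   # Hebb's rule for one pattern
np.fill_diagonal(w_sketch, 0)                       # no self-connections

corrupted = stored.copy()
corrupted[1] = +1                  # turn on the second pixel, which should be off

a = w_sketch @ corrupted           # activations of all 25 neurons at once
recalled = np.where(a >= 0, 1, -1) # threshold rule from above

print(a[0])                                   # -22.0, as computed by hand above
print(np.sum(recalled == stored), "of 25 pixels match the perfect A")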

But how do we actually set the weights?¶

For that we are going to use Hebb's rule: we create a matrix of the appropriate size and populate it according to this rule. For a single pattern, the rule is:

$$w_{nm} = y_n y_m$$

Let's say we wanted to add the memory A to the network; here is how the first row would look:

In [ ]:
w = np.zeros((25,25))
memory = reference_A[0].flatten()

w[0, 0] += 0
w[0, 1] += (memory[0]*memory[1])
w[0, 2] += (memory[0]*memory[2])
w[0, 3] += (memory[0]*memory[3])
w[0, 4] += (memory[0]*memory[4])
w[0, 5] += (memory[0]*memory[5])
w[0, 6] += (memory[0]*memory[6])
w[0, 7] += (memory[0]*memory[7])
w[0, 8] += (memory[0]*memory[8])
w[0, 9] += (memory[0]*memory[9])
w[0, 10] += (memory[0]*memory[10])
w[0, 11] += (memory[0]*memory[11])
w[0, 12] += (memory[0]*memory[12])
w[0, 13] += (memory[0]*memory[13])
w[0, 14] += (memory[0]*memory[14])
w[0, 15] += (memory[0]*memory[15])
w[0, 16] += (memory[0]*memory[16])
w[0, 17] += (memory[0]*memory[17])
w[0, 18] += (memory[0]*memory[18])
w[0, 19] += (memory[0]*memory[19])
w[0, 20] += (memory[0]*memory[20])
w[0, 21] += (memory[0]*memory[21])
w[0, 22] += (memory[0]*memory[22])
w[0, 23] += (memory[0]*memory[23])
w[0, 24] += (memory[0]*memory[24])
In [ ]:
w[0]
Out[ ]:
array([ 0.,  1., -1.,  1.,  1.,  1., -1.,  1., -1.,  1.,  1., -1., -1.,
       -1.,  1.,  1., -1.,  1., -1.,  1., -1.,  1.,  1.,  1., -1.])
In [ ]:
plt.imshow(w[0].reshape(5,5))
Out[ ]:
<matplotlib.image.AxesImage at 0x78532fcc4370>
[Figure: the first row of w reshaped to 5x5]
In [ ]:
w = np.zeros((25,25))
memory = reference_A[1].flatten()

w[0, 0] += 0
w[0, 1] += (memory[0]*memory[1])
w[0, 2] += (memory[0]*memory[2])
w[0, 3] += (memory[0]*memory[3])
w[0, 4] += (memory[0]*memory[4])
w[0, 5] += (memory[0]*memory[5])
w[0, 6] += (memory[0]*memory[6])
w[0, 7] += (memory[0]*memory[7])
w[0, 8] += (memory[0]*memory[8])
w[0, 9] += (memory[0]*memory[9])
w[0, 10] += (memory[0]*memory[10])
w[0, 11] += (memory[0]*memory[11])
w[0, 12] += (memory[0]*memory[12])
w[0, 13] += (memory[0]*memory[13])
w[0, 14] += (memory[0]*memory[14])
w[0, 15] += (memory[0]*memory[15])
w[0, 16] += (memory[0]*memory[16])
w[0, 17] += (memory[0]*memory[17])
w[0, 18] += (memory[0]*memory[18])
w[0, 19] += (memory[0]*memory[19])
w[0, 20] += (memory[0]*memory[20])
w[0, 21] += (memory[0]*memory[21])
w[0, 22] += (memory[0]*memory[22])
w[0, 23] += (memory[0]*memory[23])
w[0, 24] += (memory[0]*memory[24])

print(w[0])
[ 0.  1. -1.  1.  1.  1. -1.  1. -1.  1.  1. -1. -1. -1.  1.  1. -1.  1.
 -1.  1. -1.  1.  1.  1. -1.]

Using matrices...¶

In [ ]:
# column vector (25x1) multiplied by row vector (1x25): the outer product
w = np.matmul(memory[:, np.newaxis], [memory])

# set self-interaction terms to zero
np.fill_diagonal(w, 0)

# check that our method is the same as the previous
print(w[0])
[ 0  1 -1  1  1  1 -1  1 -1  1  1 -1 -1 -1  1  1 -1  1 -1  1 -1  1  1  1
 -1]
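As a quick sanity check, the weight matrix we just built has the two properties described earlier: it is symmetric and has zeros on the diagonal.

In [ ]:
# check the weight-matrix properties: w_nm == w_mn and w_nn == 0
print("symmetric:    ", np.array_equal(w, w.T))
print("zero diagonal:", np.all(np.diag(w) == 0))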

Remembering many patterns¶

If you wanted to store $K$ patterns, you add up the product of the $n$th and $m$th entries for each pattern:

$$w_{nm} = (y^{(1)}_{n} y^{(1)}_{m}) + (y^{(2)}_{n} y^{(2)}_{m}) + \dots + (y^{(K)}_{n} y^{(K)}_{m})$$

$$w_{nm} = \sum_{k=1}^K y_n^{(k)} y_m^{(k)}$$

In your own implementation, it would be tedious to write the above out by hand -- think about how you could use a for loop to build the weight matrix instead (one possible version is sketched after the skeleton below).

In [ ]:
np.shape(reference_A)
Out[ ]:
(10, 5, 5)
In [ ]:
# # HOW do we instantiate this?
# patterns = reference_A.copy()

# weights =

# for k in range(len(patterns)):
#   memory = patterns[k].flatten()
#   for m in range(len(memory)):
#     for n in range(len(memory)):
#       ???
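One possible way to fill in the skeleton above -- a sketch, not the official solution -- using the same variable names (patterns, weights, memory) and the sum over patterns from Hebb's rule:

In [ ]:
patterns = reference_A.copy()

# 25x25 weight matrix, starting from zero
weights = np.zeros((25, 25))

for k in range(len(patterns)):
    memory = patterns[k].flatten()          # 5x5 image -> 25-entry vector
    for m in range(len(memory)):
        for n in range(len(memory)):
            if m != n:                      # no self-connections
                weights[m, n] += memory[m] * memory[n]

# vectorized alternative: weights += np.outer(memory, memory) inside the loop,
# followed by np.fill_diagonal(weights, 0) at the end
print(weights[0, :5])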

2) Feedforward neuron model¶

  • Choose two letters -- say A and B, or some other pair, and collect all of the imperfect As and Bs -- let's call this your data $X$, and their labels $t$ (whether each imperfect letter is an A or a B -- you need to pick one letter to be +1 and the other to be -1).
  • It is good practice to split up your data into a training set, which you use to train a model like your one-neuron network, and then a testing set, so that you can evaluate the model's performance on unseen data.
  • To do this, if you have 2000 examples of A and 2000 examples of B, it would be good to randomize the order of the data. If $N=4000$ (the total number of examples, both As and Bs), then you can get a random ordering via np.random.choice(np.arange(N), N, replace=False). Then, set some number of training points N_train, and use X_train = X_shuffled[:N_train] as your training examples. Here's an example of making a random shuffling (a sketch of assembling the full $X$ and $t$ follows it):
In [ ]:
N = 5
# sample array of N indices, without replacement
random_shuffling = np.random.choice(np.arange(N), N, replace=False)
print(random_shuffling)
# Then, you can shuffle X via X_shuffled=X[random_shuffling]
# And you definitely want to use the same shuffling for T, so that
# you keep the same associations between letters and their labels
# T_shuffled = T[random_shuffling]
[3 2 0 4 1]
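Building on that, here is a sketch of assembling the data matrix $X$ and the labels $t$ for, say, A vs B (a choice on my part -- any pair works), and splitting them into train and test sets. It reuses hand_A from above and loads the handwritten B's the same way:

In [ ]:
# handwritten B's, loaded like the A's above
hand_B = load_letter(handwritten_letters_url[1])

# flatten each 5x5 image into a 25-entry row; stack A's on top of B's
X = np.vstack([hand_A.reshape(len(hand_A), 25),
               hand_B.reshape(len(hand_B), 25)])
# labels: +1 for A, -1 for B
T = np.concatenate([np.ones(len(hand_A)), -np.ones(len(hand_B))])

# shuffle X and T with the same random ordering, then split
N = len(X)
order = np.random.choice(np.arange(N), N, replace=False)
X_shuffled, T_shuffled = X[order], T[order]

N_train = int(0.8 * N)                      # e.g. an 80/20 train/test split
X_train, T_train = X_shuffled[:N_train], T_shuffled[:N_train]
X_test, T_test = X_shuffled[N_train:], T_shuffled[N_train:]
print(X_train.shape, X_test.shape)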
  • The neuron model actually has 26 parameters -- the activation $a$ is $w_0 + w_1 x_1 + \dots + w_{25} x_{25}$. The easiest way to implement this is to add a column of 1s to your $X$ data (think of it as a hidden $x_0=1$ that gets multiplied by $w_0$). Here's how you can append a column of 1s to an array:
In [ ]:
N = 3
# make an example array
X = np.arange(N**2+N).reshape((N, N+1))
X
Out[ ]:
array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11]])
In [ ]:
# just np.ones(N) gives you an array of N ones, with shape (N,)
# the [:, np.newaxis] converts that array
# into a column vector, with shape (N,1)
ones = np.ones(N)[:, np.newaxis]
ones
Out[ ]:
array([[1.],
       [1.],
       [1.]])
In [ ]:
# "horizontal stack" the column vector onto X:
np.hstack((ones, X))
Out[ ]:
array([[ 1.,  0.,  1.,  2.,  3.],
       [ 1.,  4.,  5.,  6.,  7.],
       [ 1.,  8.,  9., 10., 11.]])
  • The key thing to implement is the update of the weight vector:
    • If you use stochastic gradient descent, then in each step of training, you
    • pick a random data point, $X^{(m)}$,
    • predict its label via the current state of the model, $y^{(m)} = \frac{1}{1+e^{-\sum_j w_{old, j} X^{(m)}_j }}$,
    • then get its true label $t^{(m)}$, and
    • update your weights via $w_{new} = w_{old} + \eta (t^{(m)} - y^{(m)}) X^{(m)}$
    • If you use batch gradient descent, then in each step of training you pass through the entire dataset, so each weight update uses all of the data: $w_{new} = w_{old} + \eta \sum_n (t^{(n)} - y^{(n)}) X^{(n)}$
  • It would be good to compare what the results look like with stochastic gradient descent and the batch version -- which method takes longer to run? By how much?
  • When just starting out, it could be good to set some reasonable max number of steps that you know won't take too long to wait, just to get a sense of the performance of the model. After that, think about convergence conditions (the loss function, the weights, etc.). A possible filled-in version of the SGD branch is sketched after the skeleton below.
In [ ]:
# set iteration steps/learning rate/regularization parameters
# found after manual exploration until decent convergence
n_steps = #?
eta = #?
alpha = #?

# initialize weights as random
ws = #? whats the dimension?

# what else do we need to keep track of?
all_pred_ys = [] #predictions
losses = [] #losses

# loop through train steps
for s in range(1, n_steps):

    # current weights
    cur_w = #?
    next_w = #?

    loss = 0
    pred_ys = []

    # stochastic gradient descent
    if do_SGD:

        # 1) pick a point at random, retrieve its letter and true label
        m = #?
        Xm = #?
        tm = #?

        # 2) get predicted label
        pred_y = #?

        # 3) update weights
        next_w += #?
        pred_ys.append(pred_y)

        # 4) update loss
        loss -= #?

    # batch gradient descent
    else:

        # go through all data points
        for n in range(N_train):
            # 1) get data point and true label
            Xn = #?
            tn = #?

            # 2) get predicted label
            pred_y = #?

            # 3) update weights
            next_w += #?
            pred_ys.append(pred_y)

            # 4) update loss
            loss -= #?

    all_pred_ys.append(pred_ys)
    losses.append(loss)

    # fill in next weight
    ws[?, ?] = next_w #what indices?

all_pred_ys = np.array(all_pred_ys)
losses = np.array(losses)
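For reference, here is one possible way to fill in the stochastic-gradient-descent branch of the skeleton -- a sketch under a few simplifying choices of mine, not the official solution. It uses X_train and T_train from the splitting sketch above, keeps only the current weight vector rather than the full ws history, skips the batch branch and the regularization parameter alpha, and maps the +1/-1 labels to 1/0 so they match the sigmoid output:

In [ ]:
def sigmoid(a):
    return 1.0 / (1.0 + np.exp(-a))

# bias trick: prepend a column of ones, so there are 26 weights in total
Xb_train = np.hstack((np.ones(len(X_train))[:, np.newaxis], X_train))
t01_train = (T_train + 1) / 2               # +1 (A) -> 1, -1 (B) -> 0

n_steps = 2000                              # rough values; tune by hand
eta = 0.01

rng = np.random.default_rng(0)
w = rng.normal(0, 0.01, Xb_train.shape[1])  # small random initial weights
losses = []

for s in range(n_steps):
    # stochastic gradient descent: one random point per step
    m = rng.integers(len(Xb_train))
    Xm, tm = Xb_train[m], t01_train[m]

    pred_y = sigmoid(np.dot(w, Xm))         # predicted label, in (0, 1)
    w = w + eta * (tm - pred_y) * Xm        # update rule from the bullet points

    # cross-entropy loss for this point (1e-12 avoids log(0))
    losses.append(-(tm * np.log(pred_y + 1e-12)
                    + (1 - tm) * np.log(1 - pred_y + 1e-12)))

plt.plot(losses)
plt.xlabel("training step")
plt.ylabel("per-point loss")
plt.show()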
  • KEY: look at the resultant weights of the network!!! Especially the weights tied to the pixels of the letters (i.e., not $w_0$, the bias). Here's one way to link the 25 weights back to our 5x5 representation:
In [ ]:
# make random weights corresponding to 25 pixels, reshape to 5x5
w = np.random.normal(0, 1, 25).reshape((5,5))

# make a heatmap, positive weights are red, negative weights are blue
import seaborn as sns
plt.figure()
sns.heatmap(w, annot=True, cmap='bwr', center=0)
plt.show()
[Figure: 5x5 heatmap of the random example weights, positive in red and negative in blue]
  • The weights in the one-neuron model have a direct interpretation. Let's say you decided that letter A is "+1" and letter B is "-1", and you want to know whether a particular corrupted letter is more likely to be an A or a B. Each of the 25 non-bias weights in the network is tied to a pixel, and each one relates to how likely the letter is to be an A or a B when that pixel is ON. For instance, B's have flat edges along the top, so the first pixel, in the top-left corner, is usually going to be ON in examples of B's. In contrast, A's have pointy tops and very rarely have lit-up top-left corners. So you'd expect the weight of the first pixel to be negative (when you see an example with a lit-up first pixel, that should clue you in to a B, which is "-1" in our scheme, so the contribution from that first pixel should be negative).
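If you want to check that intuition against the data, you can count how often the top-left pixel is actually ON in each class (using hand_A from above and hand_B from the splitting sketch):

In [ ]:
# fraction of examples with the top-left pixel ON (+1), per class
print("top-left pixel ON in A's: {:.2f}".format(np.mean(hand_A[:, 0, 0] == 1)))
print("top-left pixel ON in B's: {:.2f}".format(np.mean(hand_B[:, 0, 0] == 1)))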