RPZ Assignment: Logistic Regression¶
Detailed BRUTE upload instructions at the end of this notebook.
Introduction¶
In this lab we will build a logistic regression model for letter and digit classification tasks. We will start with a simple 1D measurement so that we can visualise the relevant variables and characteristics of the solution. We will then move on to an MNIST digit classification problem and work in a 784-dimensional space.
It has been shown in the lecture that for many practical problems, the log odds $a(x)$ can be written as a linear function of the input $x$
$$ a(x) = \ln\frac{p_{K|x}(+1|x)}{p_{K|x}(-1|x)} = w\cdot x\;, $$where the original data vector $x$ has been augmented by adding 1 as its first component (corresponding to the bias in the linear function). It follows that the a posteriori probabilities then take the form of a sigmoid function acting on a linear function of $x$
$$ p_{K|x}(k|x) = \frac{1}{1+e^{-kw\cdot x}} = \sigma(kw\cdot x)\qquad k\in\{-1, +1\}. $$The task of estimating the a posteriori probabilities thus reduces to estimating their parameter $w$. This can be done using the maximum likelihood principle. Given a training set $\mathcal{T} = \{(x_1, k_1), \ldots, (x_N, k_N)\}$, ML estimation leads to the following problem: \begin{align*} w^* &= \arg\min_w E(w), \qquad \text{where}\\ E(w) &= \frac{1}{N}\sum_{(x,k) \in \mathcal{T}}\ln(1+e^{-kw\cdot x})\;, \end{align*} The normalisation by the number of training samples makes the energy, and thus the gradient step size, independent of the training set size.
We also know that there is no closed-form solution to this problem, so a numerical optimisation method has to be applied. Fortunately, the energy is a convex function, so any convex optimisation algorithm could be used. We will use the gradient descent method in this lab for its simplicity. However, note that many faster-converging methods are available (e.g. the heavy-ball method or second-order methods).
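As a standalone illustration of the numerical optimisation (a minimal sketch on a toy convex function, not the assignment's function), plain gradient descent repeatedly steps against the gradient until the update becomes small; the step size `alpha` and tolerance here are arbitrary choices:

```python
import numpy as np

def gradient_descent(grad, w_init, alpha=0.1, epsilon=1e-6, max_iter=10_000):
    """Plain gradient descent: w <- w - alpha * grad(w),
    stopped once the update is no larger than epsilon."""
    w = np.asarray(w_init, dtype=np.float64)
    for _ in range(max_iter):
        w_new = w - alpha * grad(w)
        if np.linalg.norm(w_new - w) <= epsilon:
            return w_new
        w = w_new
    return w

# minimise the convex function f(w) = (w - 3)^2, whose gradient is 2(w - 3);
# the iterates converge to the minimiser w = 3
w_star = gradient_descent(lambda w: 2 * (w - 3.0), w_init=[0.0])
```

Because the logistic loss above is convex, the same loop applied to its gradient converges to the global optimum from any initialisation.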
%load_ext autoreload
%autoreload 2
from logreg import *
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
Part 1: Letter classification¶
The first task is to classify images of letters 'A' and 'C' using the following measurement:
x = normalise( (sum of pixel values in the left half of the image)
             - (sum of pixel values in the right half of the image))
as implemented in compute_measurements(imgs, norm_parameters). For numerical stability, the function normalises the measurements to zero mean and unit variance. In this first task, the measurement is one-dimensional, which allows easy visualisation of the progress and the results.
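The train/test normalisation pattern behind compute_measurements can be sketched as follows (a generic illustration with hypothetical data; the actual parameters are passed via norm_parameters):

```python
import numpy as np

# hypothetical raw 1D measurements
trn_raw = np.array([4.0, 8.0, 6.0, 2.0])
tst_raw = np.array([5.0, 9.0])

# fit the normalisation parameters on the *training* data only
mu, sigma = trn_raw.mean(), trn_raw.std()

# apply the same parameters to both sets
trn_x = (trn_raw - mu) / sigma
tst_x = (tst_raw - mu) / sigma
```

Reusing the training-set `mu` and `sigma` on the test data is exactly the requirement repeated later in the classification section.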
Load data¶
Load the data from data_logreg.npz. It contains trn and tst dictionaries with the training and test data and their labels, respectively.
data = np.load("data_logreg.npz", allow_pickle=True)
tst = data["tst"].item()
trn = data["trn"].item()
Compute the features and augment the data so that their first component is 1.
# prepare training data
raise NotImplementedError("You have to implement the rest.")
train_X = None
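The augmentation itself (prepending a row of ones, matching the dims × N data layout used in the unit tests below) can be sketched on toy data; features here is a hypothetical 1 × N measurement matrix:

```python
import numpy as np

features = np.array([[0.5, -1.2, 2.0]])   # hypothetical 1 x N measurements
ones = np.ones((1, features.shape[1]))    # bias component x0 = 1
augmented = np.vstack([ones, features])   # 2 x N, first row all ones
```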
Gradient descent optimization¶
We will implement necessary functions needed for the gradient descent on the cross-entropy loss in several steps.
Start by completing the function loss = logistic_loss(X, y, w), which computes the cross-entropy $E(w)$ given the data $X$, their labels $y$ and a solution vector $w$.
# Unit Test:
loss = logistic_loss(np.array([[1, 1, 1],[1, 2, 3]]), np.array([1, -1, -1]), np.array([1.5, -0.5]))
np.testing.assert_almost_equal(loss, 0.6601619507527583)
Implement the function g = logistic_loss_gradient(X, y, w), which returns the energy gradient $g$ at a given vector $w$. Do not forget to normalise the gradient by $1/N$!
# Unit Test:
gradient = logistic_loss_gradient(X=np.array([[1, 1, 1],[1, 2, 3]]), y=np.array([1, -1, -1]), w=np.array([1.5, -0.5]))
np.testing.assert_array_almost_equal(gradient, [0.28450597, 0.82532575])
Next, implement the function w, wt, Et = logistic_loss_gradient_descent(X, y, w_init, epsilon), which performs the gradient descent search for the optimal solution as described in lecture slide 21. As the termination condition use $||w_\text{new} - w_\text{prev}|| \le \text{epsilon}$. Do not forget to add the bias component to the data!
Try to initialise the optimization from different initial values of $w$ to test if it behaves as you would expect.
Save each candidate into wt immediately after finding it. The distance between the last two elements of wt will thus satisfy $||wt_\text{last} - wt_\text{prelast}|| \le \text{epsilon}$!
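The loop structure described above can be sketched generically (a minimal sketch assuming some loss E(w) and gradient g(w); the assignment's function takes the data and labels instead, and its step-size policy follows the lecture slides):

```python
import numpy as np

def descend(E, g, w_init, epsilon, step=1.0):
    """Generic descent loop recording every visited point and its loss."""
    w = np.asarray(w_init, dtype=np.float64)
    wt = [w]                 # every candidate, including w_init
    Et = [E(w)]
    while True:
        w_new = w - step * g(w)
        wt.append(w_new)     # saved immediately after finding it
        Et.append(E(w_new))
        if np.linalg.norm(w_new - w) <= epsilon:   # termination condition
            break
        w = w_new
    return w_new, np.array(wt).T, np.array(Et)

# toy convex problem: E(w) = ||w||^2 / 2 with gradient g(w) = w
w, wt, Et = descend(lambda w: 0.5 * w @ w, lambda w: w,
                    [4.0, -2.0], epsilon=1e-3, step=0.5)
```

Note that the last two recorded columns of `wt` are at most `epsilon` apart, as required above.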
# Unit Test:
w_init = np.array([1.75, 3.4])
epsilon = 1e-2
w, wt, Et = logistic_loss_gradient_descent(train_X, trn['labels'], w_init, epsilon)
np.testing.assert_array_almost_equal(w, [1.8343074, 3.3190428])
np.testing.assert_array_almost_equal(wt, [[1.75, 1.75997171, 1.77782062, 1.80593719, 1.83779008, 1.84398609, 1.8343074],
[3.4, 3.39233974, 3.37848624, 3.35614129, 3.32899079, 3.31724604, 3.3190428 ]])
np.testing.assert_array_almost_equal(Et, [0.25867973, 0.25852963, 0.25830052, 0.25804515, 0.25791911, 0.25791612, 0.25791452])
Experiment with the convergence speed of the algorithm when given different initial values.
# Start from a fixed point:
w_init = np.array([-7, -8], dtype=np.float64)
# or start from a random point:
# w_init = 20 * (np.random.rand(2) - 0.5)
epsilon = 1e-2
w, wt, Et = logistic_loss_gradient_descent(train_X, trn['labels'], w_init, epsilon)
Visualize the progress of the gradient descent¶
Next, plot the cross-entropy $E(w)$ at each step of the gradient descent. Save the figure as E_progress_AC.png.
You should be able to see different convergence curves for different initializations.
plt.figure()
plt.plot(Et)
plt.xlabel('iteration')
plt.ylabel('loss')
plt.title('Logistic regression error')
plt.grid('on')
plt.savefig('E_progress_AC.png')
Plot also the progress of the value of $w$ in 2D (slope + bias parts of $w$) during the optimisation. Save the figure as w_progress_2d_AC.png.
# feel free to modify this function for better visualization:
plot_gradient_descent(train_X, trn['labels'], logistic_loss, w, wt, Et)
plt.savefig('w_progress_2d_AC.png')
Preparation for classification¶
Derive the analytical solution for the classification threshold on the (1D) data, i.e. find the $x$ for which both a posteriori probabilities equal 0.5. Using the formula, complete the function thr = get_threshold(w). This function is then used to plot the a posteriori probabilities.
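One way to arrive at the formula (a sketch of the derivation, writing $w = (w_0, w_1)$ for the bias and slope components): the two a posteriori probabilities are equal exactly when the sigmoid's argument vanishes,
$$ \sigma(w\cdot x) = \tfrac{1}{2} \;\iff\; w\cdot x = 0 \;\iff\; w_0 + w_1 x = 0 \;\iff\; x = -\frac{w_0}{w_1} \qquad (w_1 \neq 0). $$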
# Unit Test:
thr = get_threshold(np.array([1.5, -0.7]))
np.testing.assert_almost_equal(thr, 2.142857142857143)
Verify the result once more by displaying it together with the a posteriori probabilities. Save the plot as aposteriori.png.
# show the aposteriori probabilities and the decision threshold
plot_aposteriori(train_X, trn['labels'], w)
plt.savefig('aposteriori.png')
Image classification¶
As we have the logistic regression training implemented, we may start using it.
Complete the function y = classify_images(X, w), which uses the learned $w$ to classify the data in $X$.
# Unit Test:
y = classify_images(np.array([[1, 1, 1, 1, 1, 1, 1],[0.5, 1, 1.5, 2, 2.5, 3, 3.5]]), np.array([1.5, -0.5]))
np.testing.assert_array_equal(y, [1, 1, 1, 1, 1, -1, -1])
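The decision rule behind such a classifier follows directly from the a posteriori probabilities: assign the label whose probability exceeds $\tfrac12$, i.e. decide by the sign of $w\cdot x$. A sketch on hypothetical data (the tie-breaking convention at $w\cdot x = 0$ is yours to fix and must match the unit test above):

```python
import numpy as np

w = np.array([1.5, -0.5])
X = np.array([[1.0, 1.0, 1.0],        # bias row
              [1.0, 4.0, 2.0]])       # hypothetical measurements

scores = w @ X                         # w . x for each column (sample)
labels = np.where(scores > 0, 1, -1)   # sign decision
```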
Use the function classify_images to classify the letters in the tst set and compute the classification error.
Make sure that you use the data normalisation computed on the training data!
# Load test letter data
raise NotImplementedError("You have to implement the rest.")
testX = None
# Classify letter test data and calculate classification error
classifiedLabels = classify_images(testX, w)
raise NotImplementedError("You have to implement the rest.")
errors = None
testError = np.sum(errors, dtype=np.float64) / errors.size
print('Letter classification error: {:.2f}%'.format(testError * 100))
Letter classification error: 7.00%
Visualize classification results¶
Finally, we visualize the classification and save the figure as classif_AC.png.
show_classification(tst['images'], classifiedLabels, 'CA')
plt.savefig('classif_AC.png')
Part 2: MNIST digit classification¶
Next we apply the method to a similar task of digit classification. However, instead of using a one-dimensional measurement we will work directly in the 784-dimensional space (28 $\times$ 28, the size of the images) using the pixel values as individual dimensions.
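Treating pixel values as individual dimensions simply means flattening each 28 × 28 image into a length-784 vector. For illustration (with hypothetical image data, using the dims × N layout from Part 1):

```python
import numpy as np

imgs = np.zeros((5, 28, 28))   # 5 hypothetical grayscale images
X = imgs.reshape(5, -1).T      # 784 x 5 feature matrix, one column per image
```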
Load the data¶
Load the data from mnist_trn.npz. Beware that the structure of the data is slightly different from the previous task.
# Load training data
data = np.load("mnist_trn.npz", allow_pickle=True)
X, y, imsize = data["X"], data["y"], data["imsize"]
Repeat the steps from Part 1 and produce similar outputs.
Prepare the data¶
# Add x0 = 1 (for the bias term)
raise NotImplementedError("You have to implement the rest.")
X = None
# Training - gradient descent of the logistic loss function
np.random.seed(1) # to get the same example outputs
w_init = np.random.rand(X.shape[0])
epsilon = 1e-2
Train the classifier¶
w, _, Et = logistic_loss_gradient_descent(X, y, w_init, epsilon)
Plot the training progress¶
Display the training progress and save the figure as E_progress_MNIST.png.
# Plot the progress of the gradient descent
plt.figure()
plt.plot(Et)
plt.xlabel('iteration')
plt.ylabel('loss')
plt.title('Logistic regression error')
plt.grid('on')
plt.savefig('E_progress_MNIST.png')
Classify the test data and calculate the classification error¶
# Load test data
data = np.load("mnist_tst.npz", allow_pickle=True)
X, y, imsize = data["X"], data["y"], data["imsize"]
raise NotImplementedError("You have to implement the rest.")
X = None
# Classify MNIST test data and calculate classification error
classifiedLabels = classify_images(X, w)
errors = None
testError = np.sum(errors, dtype=np.float64) / errors.size
print('MNIST digit classification error: {:.2f}%'.format(testError * 100))
MNIST digit classification error: 0.10%
Visualize the MNIST classification¶
Show the classification results. Save the figure as classif_MNIST.png.
# Visualize classification results
show_mnist_classification(X[1:, :], classifiedLabels, imsize)
plt.savefig('classif_MNIST.png')
Examining the feature weights¶
Because of our choice of image features, we now have a weight for each pixel (plus a bias term), which allows the following visualization. We can, to some extent, see which pixels play the most important role in the decision.
w_img = w[1:].reshape(imsize)
vmax = np.max(np.abs(w_img))
# https://matplotlib.org/stable/users/explain/colors/colormaps.html#diverging
sm = plt.imshow(w_img, cmap='bwr', vmin=-vmax, vmax=vmax)
plt.colorbar(sm)
plt.axis('off')
plt.title('Weights visualization')
plt.savefig('weight_image.png')
Submission to the BRUTE Upload System¶
To fulfill this assignment, you need to submit these files (all packed in one .zip file) into the upload system:
- logreg.ipynb - a script for data initialization, calling the implemented functions and plotting their results (for your convenience; will not be checked)
- logreg.py - containing the following implemented methods:
  - logistic_loss - a function which computes the logistic loss
  - logistic_loss_gradient - a function which computes the logistic loss gradient
  - logistic_loss_gradient_descent - gradient descent on the logistic loss
  - get_threshold - the analytical decision boundary solution for the 1D case
  - classify_images - given the log. reg. parameters, classifies the input data into {-1, +1}
- E_progress_AC.png, w_progress_2d_AC.png, aposteriori.png, classif_AC.png, E_progress_MNIST.png, classif_MNIST.png - the images specified in the tasks
When preparing a zip file for the upload system, do not include any directories, the files have to be in the zip file root.
Bonus task¶
Implement logistic regression with dimensionality lifting as shown in the following figure from [1]. Note that in the figure $w$ denotes the class label and $\phi$ the sought parameter vector. Generate similar outputs to verify a successful implementation.
References¶
[1] Simon J. D. Prince, Computer Vision: Models, Learning and Inference, 2012