5 files changed: +69 −44

knn.py +9 −19

@@ -43,35 +43,25 @@ def evaluate_knn(data_train, labels_train, data_test, labels_test, k):
    return accuracy

if __name__ == "__main__":
    # Extraction of the data from Cifar database
    data, labels = read_cifar("./data/cifar-10-batches-py")
    # Formatting the data into training and testing sets
    data_train, labels_train, data_test, labels_test = split_dataset(data, labels, 0.9)
    # Data to plot
    k_list = [k for k in range(1, 21)]
    accuracy = [evaluate_knn(data_train, labels_train, data_test, labels_test, k) for k in range (1, 21)]
    # Plot the graph
    plt.close()
    plt.plot(k_list, accuracy)
    plt.title("Variation of k-nearest neighbors method accuracy for k from 1 to 20")
    plt.xlabel("k value")
    plt.ylabel("Accuracy")
    plt.grid(True, which='both')
    plt.savefig("results/knn.png")
-     # x_test = np.array([[1,2],[4,6]])
-     # x_labels_test = np.array([0,1])
-     # x_train = np.array([[2,4],[7,2],[4,6]])
-     # x_labels_train = np.array([0,1,1])
-     # dist = distance_matrix(x_test, x_train)
-     # accuracy = evaluate_knn(x_train, x_labels_train, x_test, x_labels_test, 1)
-     # print(accuracy)
-     plt.show()
-     #plt.savefig("results/knn.png")
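Note: the bodies of distance_matrix and evaluate_knn are collapsed in this diff. For reference, here is a minimal sketch of how they are commonly written for this CIFAR-10 exercise; the signatures match the calls above, but the bodies and the knn_predict helper are assumptions of mine, not code from this repository.

import numpy as np

def distance_matrix(a, b):
    # Pairwise Euclidean distances between the rows of a (n, d) and the rows of b (m, d),
    # using ||x - y||^2 = ||x||^2 + ||y||^2 - 2 x.y
    sq = np.sum(a**2, axis=1)[:, np.newaxis] + np.sum(b**2, axis=1) - 2 * a @ b.T
    return np.sqrt(np.maximum(sq, 0))

def knn_predict(dists, labels_train, k):
    # For each test example, take the k closest training examples and vote on their labels.
    labels_train = np.asarray(labels_train, dtype=np.int64)
    nearest = np.argsort(dists, axis=1)[:, :k]
    votes = labels_train[nearest]
    return np.array([np.bincount(row).argmax() for row in votes])

def evaluate_knn(data_train, labels_train, data_test, labels_test, k):
    # Accuracy on the test set = fraction of correctly predicted labels.
    dists = distance_matrix(data_test, data_train)
    predictions = knn_predict(dists, labels_train, k)
    return np.mean(predictions == labels_test)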
mlp.py +29 −21

@@ -11,16 +11,16 @@ def learn_once_mse(w1, b1, w2, b2, data, targets, learning_rate):
    # Forward pass
    a0 = data  # the data are the input of the first layer
    z1 = np.matmul(a0, w1) + b1  # input of the hidden layer
-     a1 = 1 / (1 + np.exp(-z1))  # output of the hidden layer (sigmoid activation function)
+     a1 = sigmoid(z1)  # output of the hidden layer (sigmoid activation function)
    z2 = np.matmul(a1, w2) + b2  # input of the output layer
-     a2 = 1 / (1 + np.exp(-z2))  # output of the output layer (sigmoid activation function)
+     a2 = sigmoid(z2)  # output of the output layer (sigmoid activation function)
    predictions = a2  # the predicted values are the outputs of the output layer

    # Compute loss (MSE)
    loss = np.mean(np.square(predictions - targets))

    # According to the formulas established by theory :
-     d_a2 = 2 / N * (1 - targets)
+     d_a2 = 2 / N * (a2 - targets)
    d_z2 = d_a2 * a2 * (1 - a2)
    d_w2 = np.matmul(a1.T, d_z2)
    d_b2 = d_z2

@@ -46,30 +46,36 @@ def one_hot(labels):
    return one_hot_matrix

+ def softmax(x):
+     e_x = np.exp(x - np.max(x))  # Subtracting the maximum value for numerical stability
+     return e_x / e_x.sum(axis=0)

def learn_once_cross_entropy(w1, b1, w2, b2, data, labels_train, learning_rate):
    N = len(labels_train)  # number of training examples

    # Forward pass
    a0 = data  # the data are the input of the first layer
    z1 = np.matmul(a0, w1) + b1  # input of the hidden layer
-     a1 = 1 / (1 + np.exp(-z1))  # output of the hidden layer (sigmoid activation function)
+     a1 = sigmoid(z1)  # output of the hidden layer (sigmoid activation function)
    z2 = np.matmul(a1, w2) + b2  # input of the output layer
-     a2 = 1 / (1 + np.exp(-z2))  # output of the output layer (sigmoid activation function)
+     a2 = softmax(z2)  # output of the output layer (softmax activation function)
    predictions = a2  # the predicted values are the outputs of the output layer
    targets_one_hot = one_hot(labels_train)  # target as a one-hot encoding for the desired labels

    # Cross-entropy loss
-     loss = -np.sum(targets_one_hot * np.log(predictions)) / N
+     epsilon = 0.00001
+     loss = - np.sum(targets_one_hot * np.log(predictions + epsilon)) / N

    # Backpropagation
    d_z2 = a2 - targets_one_hot
    d_w2 = np.dot(a1.T, d_z2) / N
-     d_b2 = d_z2 / N
+     d_b2 = np.sum(d_z2, axis = 0, keepdims = True) / N
    d_a1 = np.dot(d_z2, w2.T)
    d_z1 = d_a1 * z1 * (1 - a1)
    d_w1 = np.dot(a0.T, d_z1) / N
-     d_b1 = d_z1 / N
+     d_b1 = np.sum(d_z1, axis = 0, keepdims = True) / N

    # Calculation of the updated weights and biases of the network with gradient descent method
    w1 -= learning_rate * d_w1

@@ -88,9 +94,9 @@ def train_mlp(w1, b1, w2, b2, data_train, labels_train, learning_rate, num_epoch
    # Forward pass
    a0 = data_train  # the data are the input of the first layer
    z1 = np.matmul(a0, w1) + b1  # input of the hidden layer
-     a1 = 1 / (1 + np.exp(-z1))  # output of the hidden layer (sigmoid activation function)
+     a1 = sigmoid(z1)  # output of the hidden layer (sigmoid activation function)
    z2 = np.matmul(a1, w2) + b2  # input of the output layer
-     a2 = 1 / (1 + np.exp(-z2))  # output of the output layer (sigmoid activation function)
+     a2 = softmax(z2)  # output of the output layer (softmax activation function)
    predictions = a2  # the predicted values are the outputs of the output layer

    # Find the predicted class

@@ -108,9 +114,9 @@ def test_mlp(w1, b1, w2, b2, data_test, labels_test):
    # Forward pass
    a0 = data_test  # the data are the input of the first layer
    z1 = np.matmul(a0, w1) + b1  # input of the hidden layer
-     a1 = 1 / (1 + np.exp(-z1))  # output of the hidden layer (sigmoid activation function)
+     a1 = sigmoid(z1)  # output of the hidden layer (sigmoid activation function)
    z2 = np.matmul(a1, w2) + b2  # input of the output layer
-     a2 = 1 / (1 + np.exp(-z2))  # output of the output layer (sigmoid activation function)
+     a2 = softmax(z2)  # output of the output layer (softmax activation function)
    predictions = a2  # the predicted values are the outputs of the output layer

    # Find the predicted label

@@ -128,10 +134,10 @@ def run_mlp_training(data_train, labels_train, data_test, labels_test, d_h, lear
    d_in = data_train.shape[1]  # number of input neurons
    d_out = len(np.unique(labels_train))  # number of output neurons = number of classes

-     # Random initialization of the network weights and biaises
-     w1 = 2 * np.random.rand(d_in, d_h) - 1  # first layer weights
+     # Random initialization of the network weights and biaises with Xavier initialisation
+     w1 = np.random.randn(d_in, d_h) / np.sqrt(d_in)  # first layer weights
    b1 = np.zeros((1, d_h))  # first layer biaises
-     w2 = 2 * np.random.rand(d_h, d_out) - 1  # second layer weights
+     w2 = np.random.randn(d_h, d_out) / np.sqrt(d_h)  # second layer weights
    b2 = np.zeros((1, d_out))  # second layer biaises

    # Training of the MLP classifier with num_epoch steps

@@ -145,26 +151,28 @@ def run_mlp_training(data_train, labels_train, data_test, labels_test, d_h, lear
if __name__ == "__main__":
    # Parameters
    split_factor = 0.9
    d_h = 64
    learning_rate = 0.1
    num_epoch = 100

    # Extraction and formatting of the data from Cifar database
    data, labels = read_cifar("./data/cifar-10-batches-py")
    data_train, labels_train, data_test, labels_test = split_dataset(data, labels, split_factor)

    # Initialisation of the data to plot
    epochs = [i for i in range(1, num_epoch + 1)]
-     learning_accuracy = [0] * num_epoch
-     for i in range(num_epoch) :
-         train_accuracies, test_accuracy = run_mlp_training(data_train, labels_train, data_test, labels_test, d_h, learning_rate, i + 1)
-         learning_accuracy[i] = test_accuracy
+     train_accuracies, test_accuracy = run_mlp_training(data_train, labels_train, data_test, labels_test, d_h, learning_rate, num_epoch)

-     plt.plot(epochs, learning_accuracy)
    # Plot the graph
+     plt.close()
+     plt.plot(epochs, train_accuracies)
    plt.title("Evolution of learning accuracy across learning epochs")
    plt.xlabel("number of epochs")
    plt.ylabel("Accuracy")
    plt.grid(True, which='both')
-     plt.show()
    plt.savefig("results/mlp.png")
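Two conventions worth noting next to the new helpers, with a small self-contained sketch (my own illustration, not code from this repository). Here z2 = np.matmul(a1, w2) + b2 has shape (N, d_out), one example per row, so a row-wise softmax normalises over axis=1 (summing over axis=0 would normalise across the batch instead); and the derivative of a1 = sigmoid(z1) with respect to z1 is a1 * (1 - a1), which is the term that appears in the usual backward pass through the hidden layer.

import numpy as np

def sigmoid(x):
    return 1 / (1 + np.exp(-x))

def softmax_rows(z):
    # Row-wise softmax for a batch of logits of shape (N, d_out):
    # subtract each row's max for numerical stability, then normalise each row.
    e_z = np.exp(z - np.max(z, axis=1, keepdims=True))
    return e_z / e_z.sum(axis=1, keepdims=True)

# Tiny check with made-up shapes: every row of the output sums to 1.
z2 = np.random.randn(4, 10)          # N = 4 examples, d_out = 10 classes
a2 = softmax_rows(z2)
assert np.allclose(a2.sum(axis=1), 1.0)

# Standard backward step through the hidden sigmoid:
#   d_z1 = d_a1 * a1 * (1 - a1)      (a1, not z1, in the derivative term)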
plt.xlabel("number of epochs") plt.ylabel("Accuracy") plt.grid(True, which='both') plt.show() plt.savefig("results/mlp.png") Loading read_cifar.py +31 −4 Original line number Diff line number Diff line import pickle import numpy as np from sklearn.model_selection import train_test_split import random def unpickle(file): Loading @@ -7,29 +9,54 @@ def unpickle(file): batch = pickle.load(fo, encoding='bytes') return batch def read_cifar_batch(path): batch = unpickle(path) data = batch[b'data'] labels = batch[b'labels'] return np.float32(data), np.int64(labels) def read_cifar(folder_path): # Get the test batch data, labels = read_cifar_batch("./data/cifar-10-batches-py/test_batch") # Concatenate with the 5 data batches for i in range(1,5): data = np.concatenate((data, read_cifar_batch(folder_path + "/data_batch_" + str(i))[0])) labels = np.concatenate((labels, read_cifar_batch(folder_path + "/data_batch_" + str(i))[1])) np.append(data, read_cifar_batch(folder_path + "/data_batch_" + str(i))[0]) np.append(labels, read_cifar_batch(folder_path + "/data_batch_" + str(i))[1]) return data, labels def split_dataset(data, labels, split): # Determination of an index to split the data index = int(split * len(data)) data_train, data_test = np.split(data, index) labels_train, labels_test = np.split(labels, index) # Split the data on the index tableau_combine = list(zip(data, labels)) random.shuffle(tableau_combine) data_train, data_test, labels_train, labels_test = train_test_split(data, labels, test_size=1-split, random_state=1) # data_train, data_test = np.split(data, [index]) # labels_train, labels_test = np.split(labels, [index]) return data_train, labels_train, data_test, labels_test if __name__ == "__main__": # Extraction of the data from Cifar database data, labels = read_cifar("./data/cifar-10-batches-py") print(data) print(labels) # Formatting the data into training and testing sets split = 0.21 data_train, labels_train, data_test, labels_test = split_dataset(data, labels, split) print(data_train) print(labels_train) print(data_test) print(labels_test) results/knn.png 0 → 100644 +39.4 KiB 39.45 KiB results/mlp.png 0 → 100644 +29.6 KiB 29.58 KiB
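Similarly for split_dataset: np.split(data, index) with a scalar asks numpy for index equal-sized pieces and raises an error unless the length divides evenly, whereas np.split(data, [index]) cuts once at that position, which is what the commented-out lines above do; train_test_split shuffles by default and returns train/test pieces for each array passed in. A short sketch of both splitting styles, with made-up shapes (illustration only):

import numpy as np
from sklearn.model_selection import train_test_split

data = np.arange(20).reshape(10, 2)      # 10 examples, 2 features
labels = np.arange(10) % 2
split = 0.9
index = int(split * len(data))           # 9

# np.split(data, 9) would try to cut 10 rows into 9 equal parts and raise an error;
# np.split(data, [9]) cuts once, after row 9.
data_train, data_test = np.split(data, [index])
labels_train, labels_test = np.split(labels, [index])

# train_test_split shuffles (by default) and returns train/test pairs in order:
data_train, data_test, labels_train, labels_test = train_test_split(
    data, labels, test_size=1 - split, random_state=1)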