# neural_network.py
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import make_circles
from sklearn.model_selection import train_test_split

np.random.seed(123)

# make the dataset
X, y = make_circles(n_samples=1000, factor=0.5, noise=0.1)

fig = plt.figure(figsize=(8, 6))
plt.scatter(X[:, 0], X[:, 1], c=y)
plt.xlim([-1.5, 1.5])
plt.ylim([-1.5, 1.5])
plt.title('Dataset')
plt.xlabel('First feature')
plt.ylabel('Second feature')
plt.show()
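# make_circles draws two concentric noisy rings: `factor` is the ratio of the
# inner to the outer radius and `noise` is the standard deviation of Gaussian
# jitter. The classes are therefore not linearly separable, which is why the
# network below needs a hidden layer.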
def print_shape(datasets):
    return datasets.shape

# reshape the targets into a column vector with shape (n_samples, 1)
y_true = y[:, np.newaxis]

X_train, X_test, y_train, y_test = train_test_split(X, y_true)
print("the shape of X_train is: %s" % str(print_shape(X_train)))
print("the shape of X_test is: %s" % str(print_shape(X_test)))
print("the shape of y_train is: %s" % str(print_shape(y_train)))
print("the shape of y_test is: %s" % str(print_shape(y_test)))
# Neural Network Class
class NeuralNet():
    def __init__(self, n_inputs, n_outputs, n_hidden):
        self.n_inputs = n_inputs
        self.n_outputs = n_outputs
        self.n_hidden = n_hidden
        # initialize weight matrices (standard normal) and bias vectors (zeros)
        self.W_h = np.random.randn(self.n_inputs, self.n_hidden)
        self.b_h = np.zeros((1, self.n_hidden))
        self.W_o = np.random.randn(self.n_hidden, self.n_outputs)
        self.b_o = np.zeros((1, self.n_outputs))
    def sigmoid(self, a):
        return 1 / (1 + np.exp(-a))
    def forward_pass(self, X):
        """
        Propagates the given input X forward through the net.

        Returns:
        A_h: matrix of activations of all hidden neurons for all input examples
        O_h: matrix of outputs of all hidden neurons for all input examples
        A_o: matrix of activations of all output neurons for all input examples
        O_o: matrix of outputs of all output neurons for all input examples
        """
        # compute activations and outputs of the hidden units (tanh)
        A_h = np.dot(X, self.W_h) + self.b_h
        O_h = np.tanh(A_h)
        # compute activations and outputs of the output units (sigmoid)
        A_o = np.dot(O_h, self.W_o) + self.b_o
        O_o = self.sigmoid(A_o)
        outputs = {
            "A_h": A_h,
            "A_o": A_o,
            "O_h": O_h,
            "O_o": O_o,
        }
        return outputs
    def cost(self, y_true, y_predict, n_sample):
        # compute and return the cost over all examples:
        # the same cross-entropy cost as in logistic regression
        cost = (-1 / n_sample) * np.sum(
            y_true * np.log(y_predict) + (1 - y_true) * np.log(1 - y_predict))
        cost = float(np.squeeze(cost))
        assert isinstance(cost, float)
        return cost
    def backward_pass(self, X, Y, n_samples, outputs):
        """
        Propagates the errors backward through the net.

        Returns:
        dW_h: partial derivatives of the loss function w.r.t. hidden weights
        db_h: partial derivatives of the loss function w.r.t. hidden biases
        dW_o: partial derivatives of the loss function w.r.t. output weights
        db_o: partial derivatives of the loss function w.r.t. output biases
        """
        # for a sigmoid output with cross-entropy loss, dL/dA_o = O_o - Y
        dA_o = outputs['O_o'] - Y
        dW_o = (1 / n_samples) * np.dot(outputs['O_h'].T, dA_o)
        db_o = (1 / n_samples) * np.sum(dA_o, axis=0, keepdims=True)
        # tanh'(A_h) = 1 - O_h**2
        dA_h = np.dot(dA_o, self.W_o.T) * (1 - np.power(outputs['O_h'], 2))
        dW_h = (1 / n_samples) * np.dot(X.T, dA_h)
        # sum per hidden unit (axis=0) so each bias gets its own gradient
        db_h = (1 / n_samples) * np.sum(dA_h, axis=0, keepdims=True)
        gradients = {
            "dW_o": dW_o,
            "db_o": db_o,
            "dW_h": dW_h,
            "db_h": db_h,
        }
        return gradients
    def update_weights(self, gradients, eta):
        """
        Update the model parameters using a fixed learning rate.
        """
        self.W_o = self.W_o - eta * gradients["dW_o"]
        self.W_h = self.W_h - eta * gradients["dW_h"]
        self.b_o = self.b_o - eta * gradients["db_o"]
        self.b_h = self.b_h - eta * gradients["db_h"]
    def train(self, X, y, n_iters=500, eta=0.3):
        """
        Train the neural net on the given input data.
        """
        n_samples, _ = X.shape
        for i in range(n_iters):
            outputs = self.forward_pass(X)
            cost = self.cost(y, outputs['O_o'], n_sample=n_samples)
            gradients = self.backward_pass(X, y, n_samples, outputs)
            if i % 100 == 0:
                print(f'cost at iteration {i}: {np.round(cost, 4)}')
            self.update_weights(gradients, eta)
    def predict(self, X):
        """
        Computes and returns the network predictions for the given dataset.
        """
        outputs = self.forward_pass(X)
        y_predict = [1 if elem >= 0.5 else 0 for elem in outputs['O_o']]
        return np.array(y_predict)[:, np.newaxis]
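
# Optional gradient check, a minimal sketch for verifying backward_pass against
# centered finite differences on the output weights. The helper name, the
# epsilon, and the tiny batch in the usage example are illustrative choices.
def grad_check_W_o(net, X_small, y_small, eps=1e-5):
    n = X_small.shape[0]
    analytic = net.backward_pass(X_small, y_small, n,
                                 net.forward_pass(X_small))["dW_o"]
    numeric = np.zeros_like(net.W_o)
    for i in range(net.W_o.shape[0]):
        for j in range(net.W_o.shape[1]):
            old = net.W_o[i, j]
            net.W_o[i, j] = old + eps  # nudge one weight up
            c_plus = net.cost(y_small, net.forward_pass(X_small)["O_o"], n)
            net.W_o[i, j] = old - eps  # and down
            c_minus = net.cost(y_small, net.forward_pass(X_small)["O_o"], n)
            net.W_o[i, j] = old  # restore
            numeric[i, j] = (c_plus - c_minus) / (2 * eps)
    # should be tiny (around 1e-8) if the analytic gradients are correct
    return np.max(np.abs(analytic - numeric))

# e.g.: print(grad_check_W_o(NeuralNet(n_inputs=2, n_outputs=1, n_hidden=6),
#                            X_train[:5], y_train[:5]))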
nn = NeuralNet(n_inputs=2, n_hidden=6, n_outputs=1)
print("shapes of the weight matrices and bias vectors:")
print(f'W_h shape: {nn.W_h.shape}')
print(f'b_h shape: {nn.b_h.shape}')
print(f'W_o shape: {nn.W_o.shape}')
print(f"b_o shape: {nn.b_o.shape}")
print("training >>>>>>>>>")
nn.train(X_train, y_train, n_iters=10000, eta=0.5)
# test
n_test_samples, _ = X_test.shape
y_predict = nn.predict(X_test)
accuracy = np.sum(y_predict == y_test) / n_test_samples * 100
print(f"classification accuracy on the test set: {accuracy:.1f}%")
# visualize the learned decision boundary by predicting on a large,
# very noisy sample drawn from the same distribution
X_temp, y_temp = make_circles(n_samples=60000, noise=0.5)
y_predict_temp = nn.predict(X_temp)
y_predict_temp = np.ravel(y_predict_temp)
fig = plt.figure(figsize=(8, 12))
ax = fig.add_subplot(2, 1, 1)
plt.scatter(X[:, 0], X[:, 1], c=y)
plt.xlim([-1.5, 1.5])
plt.ylim([-1.5, 1.5])
plt.xlabel("First Feature")
plt.ylabel("Second Feature")
plt.title("Training and testing set")
ax = fig.add_subplot(2, 1, 2)
plt.scatter(X_temp[:, 0], X_temp[:, 1], c=y_predict_temp)
plt.xlim([-1.5, 1.5])
plt.ylim([-1.5, 1.5])
plt.xlabel("First Feature")
plt.ylabel("Second Feature")
plt.title("Decision boundary")
plt.show()
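
# Optional alternative view: instead of scattering noisy samples, evaluate the
# trained net on a dense grid and shade the two predicted regions. The grid
# resolution below (300 x 300) is an arbitrary illustrative choice.
xx, yy = np.meshgrid(np.linspace(-1.5, 1.5, 300), np.linspace(-1.5, 1.5, 300))
grid = np.c_[xx.ravel(), yy.ravel()]
zz = nn.predict(grid).reshape(xx.shape)
plt.figure(figsize=(8, 6))
plt.contourf(xx, yy, zz, alpha=0.3)
plt.scatter(X[:, 0], X[:, 1], c=y)
plt.title("Decision boundary (grid evaluation)")
plt.show()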