import numpy as np 
def sigmoid(x):
    return 1 / (1 + np.exp(-1 * x))

def forward(weights, bias, x):
    x = x + 1e-10
    out = sigmoid(np.dot(weights.T, x) + bias)[0][0]
    return out, int(out > 0.5)


def backpropagate(x, y, weights, bias, learning_rate):
    x = x + 1e-10
    y = y + 1e-10
    # caculate prediction
    out_1 = np.dot(weights.T, x) + bias
    out_2 = sigmoid(out_1)
    # calculate error
    error_1 = out_2 - y
    error_2 = np.square(error_1)
    # Gradient Descent Step
    dE_dy = 2 * error_1
    dsigma_dout1 = out_2 * (1 - out_2)
    # calculate gradient of error w.r.t weights
    dE_dW = dE_dy * dsigma_dout1 * x
    # calculate new weights
    new_w = weights - learning_rate * error_2 * dE_dW
    # calculate gradient of error w.r.t bias
    dE_db = dE_dy * dsigma_dout1 * 1
    # calculate new biases 
    new_b = bias - learning_rate * error_2 * dE_db
    
    return new_w, new_b


def train(data, epochs=150):
    weights_shape, bias_shape = (2,1), (1,)
    weights = np.zeros(weights_shape) + 1e-2
    bias = np.zeros(bias_shape)
    learning_rate = .1

    for _ in range(epochs):
        for batch in data:
            x = np.array(batch[:2])[:, None]
            y = np.array(batch[ 2])
            weights, bias = backpropagate(x, y, 
                                          weights, 
                                          bias,
                                          learning_rate)
    return weights, bias


and_gate_data = [(0,0,0), (0,1,0), (1,0,0), (1,1,1)]
print("AND Gate:")
print("\ta\tb\toutput\n{}".format('\t' + '\n\t'.join(['\t'.join([str(j) for j in i]) for i in and_gate_data])))

print("\nWeights and Biases:")
weights, bias = train(and_gate_data)
print(f'\tWeights: {weights[:,0]}')
print(f'\tBias: {bias[0]}')

print("\nPredictions:")
for (a, b, c) in and_gate_data:
    raw_pred, pred = forward(weights, bias, np.array([[a],[b]]))
    print(f'\tInput: {[a,b]}\t'
          f'\tTruth: {c}\t'
          f'\tPrediction: {round(raw_pred,6)} => {pred}')

AND Gate:
	a	b	output
	0	0	0
	0	1	0
	1	0	0
	1	1	1

Weights and Biases:
	Weights: [0.39349878 0.39069549]
	Bias: [-0.71500872]

Predictions:
	Input: [0, 0]		Truth: 0		Prediction: 0.328493 => 0
	Input: [0, 1]		Truth: 0		Prediction: 0.419625 => 0
	Input: [1, 0]		Truth: 0		Prediction: 0.420308 => 0
	Input: [1, 1]		Truth: 1		Prediction: 0.517289 => 1


or_gate_data = [(0,0,0), (0,1,1), (1,0,1), (1,1,1)]
print("AND Gate:")
print("\ta\tb\toutput\n{}".format('\t' + '\n\t'.join(['\t'.join([str(j) for j in i]) for i in or_gate_data])))

print("\nWeights and Biases:")
weights, bias = train(or_gate_data)
print(f'\tWeights: {weights[:,0]}')
print(f'\tBias: {bias[0]}')

print("\nPredictions:")
for (a, b, c) in or_gate_data:
    raw_pred, pred = forward(weights, bias, np.array([[a],[b]]))
    print(f'\tInput: {[a,b]}\t'
          f'\tTruth: {c}\t'
          f'\tPrediction: {round(raw_pred,6)} => {pred}')

AND Gate:
	a	b	output
	0	0	0
	0	1	1
	1	0	1
	1	1	1

Weights and Biases:
	Weights: [0.62831802 0.62989494]
	Bias: [-0.02036241]

Predictions:
	Input: [0, 0]		Truth: 0		Prediction: 0.49491 => 0
	Input: [0, 1]		Truth: 1		Prediction: 0.647834 => 1
	Input: [1, 0]		Truth: 1		Prediction: 0.647474 => 1
	Input: [1, 1]		Truth: 1		Prediction: 0.77519 => 1


xor_gate_data = [(0,0,0), (0,1,1), (1,0,1), (1,1,0)]
weights, bias = train(xor_gate_data, epochs=50000)
print(f'Weights: {weights[:,0]}')
print(f'Bias: {bias[0]}\n')
for (a, b, c) in and_gate_data:
    raw_pred, pred = forward(weights, bias, np.array([[a],[b]]))
    print(f'Input: {[a,b]}\t'
          f'Truth: {c}\t'
          f'Pred: {round(raw_pred,6)} => {pred}')

Weights: [-0.01261855 -0.00630927]
Bias: [0.00630927]

Input: [0, 0]	Truth: 0	Pred: 0.501577 => 1
Input: [0, 1]	Truth: 0	Pred: 0.5 => 1
Input: [1, 0]	Truth: 0	Pred: 0.498423 => 0
Input: [1, 1]	Truth: 1	Pred: 0.496845 => 0

A Gentle Intro to Backpropagation in Neural Networks¶

AND/OR Gate Perceptron Approximator¶

Gradient Descent¶

Let's generate and train some weights¶

Let's train and test our perceptron on an AND Gate¶

Let's try an OR Gate¶

Limitations of Perceptrons¶