# Author : Alok Dixit
# Date : 24-may-2018
"""
Objective: To implement a Backprop demo
1. We should be able to specify the number of layers in Neural net
2. A list of number of neurons in each layer
3. We should be able to specify the activation function
"""
import numpy as np
import pandas as pd
import math
# +1 for bias node
INPUT_LAYER_DIM = 2 + 1
HIDDEN_LAYER_DIM = 3
OUTPUT_LAYER_DIM = 1
NUM_OF_HIDDEN_LAYERS = 2
NUM_OF_ITERATION = 10000
# Learning Rate
alpha = 0.01
momentum = 0.01
activation_function = None
activation_grad = None
def nearest_int(x):
    # threshold a scalar prediction to the nearest class label
    return 1 if x > 0.5 else 0

def tanh(input):
    return np.array([math.tanh(inp) for inp in input])

def tanh_grad(input):
    # expects the tanh *output*, so the derivative 1 - tanh(x)^2 is 1 - input^2
    return np.array([(1.0 - inp**2) for inp in input])

def RELU(input):
    return np.array([x if x > 0 else 0 for x in input])

def RELU_grad(input):
    return np.array([1 if x > 0 else 0 for x in input])
activation_function = tanh
activation_grad = tanh_grad
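# To try the other activation defined above, swap in the ReLU pair instead:
# activation_function, activation_grad = RELU, RELU_grad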
df = pd.read_csv("DATA.csv")
# append a constant 1 to each sample for the bias input
input_xy = [(x, y, 1) for x, y in zip(df["x"], df["y"])]
label_z = df["z"]
# These arrays store the activation outputs of the neurons in each layer
input_out = np.ones(shape=(INPUT_LAYER_DIM,))
hidden_out = np.ones(shape=(NUM_OF_HIDDEN_LAYERS, HIDDEN_LAYER_DIM))
output_out = np.ones(shape=(OUTPUT_LAYER_DIM,))
def make_random_array(a, *b):
    # uniform random weights in [-1.0, 1.0), in steps of 0.01
    # (np.float is removed in recent NumPy; plain float works)
    return np.random.randint(-100, 100, size=(a, *b)).astype(float)/100
# These are the weights between layers
# w_i_h1[i] = weights from neuron i of the input layer to all neurons of the first hidden layer
w_i_h1 = make_random_array(INPUT_LAYER_DIM, HIDDEN_LAYER_DIM)
# w_hi_hj[k] = 2D matrix of weights between hidden layers k and k+1
w_hi_hj = make_random_array(NUM_OF_HIDDEN_LAYERS-1, HIDDEN_LAYER_DIM, HIDDEN_LAYER_DIM)
# w_h_o[i] = weights from neuron i of the last hidden layer to all neurons of the output layer
w_h_o = make_random_array(HIDDEN_LAYER_DIM, OUTPUT_LAYER_DIM)
# The c_* arrays cache the previous gradient for the momentum term;
# they start at zero so that the first update carries no momentum
c_i_h1 = np.zeros_like(w_i_h1)
c_hi_hj = np.zeros_like(w_hi_hj)
c_h_o = np.zeros_like(w_h_o)
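# Resulting architecture with the constants above: 3 inputs (x, y + bias)
# -> 2 hidden layers of 3 tanh neurons each -> 1 output neuron.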
print("Learning...")
for i in range(NUM_OF_ITERATION):
alpha = alpha/(i+1)
for j, inp in enumerate(input_xy):
# output of input layer(same as input to network)
label = label_z[j]
input_out = np.array(inp)
# output of hidden layers
for k, hidden_layer in enumerate(hidden_out):
if k == 0:
# out hidden_layer 1
hidden_out[k] = activation_function((input_out.dot(w_i_h1)))
else:
hidden_out[k] = activation_function((hidden_out[k-1].dot(w_hi_hj[k-1])))
# output of last layer
output_out = activation_function(hidden_out[-1].dot(w_h_o))
"""
BACKPROPOGATION START HERE !!
"""
hidden_delta = []
# error delta for output layer
err = output_out - label
output_delta = activation_grad(output_out)*err
# error delta for hidden layers
next_layer_delta = output_delta
for k, hidden_layer in enumerate(reversed(hidden_out)):
k = len(hidden_out) - k - 1
# last hidden layer
if k == len(hidden_out)-1:
err = next_layer_delta.dot(w_h_o.T)
else:
err = next_layer_delta.dot(w_hi_hj[k].T)
this_hidden_layer_delta = activation_grad(hidden_out[k])*err
next_layer_delta = this_hidden_layer_delta
hidden_delta.insert(0, this_hidden_layer_delta)
hidden_delta = np.array(hidden_delta)
# update the intput weights ==> w_i_h1
w_i_h1 = w_i_h1 - momentum*c_i_h1 - alpha*(input_out.reshape((-1,1)).dot(hidden_delta[0].reshape((1,-1))))
c_i_h1 = input_out.reshape((-1,1)).dot(hidden_delta[0].reshape((1,-1)))
# update inter-hidden layer weights
for k in range(len(w_hi_hj)):
w_hi_hj[k] = w_hi_hj[k] - momentum*c_hi_hj[k] - alpha*((hidden_out[k].T).dot(hidden_delta[k]))
c_hi_hj[k] = (hidden_out[k].T).dot(hidden_delta[k])
if i%1000 == 0 :
print("iteration {0} completed".format(i))
print("After Learning...")
for j, inp in enumerate(input_xy):
# output of input layer(same as input to network)
label = label_z[j]
input_out = np.array(inp)
# output of hidden layers
for k, hidden_layer in enumerate(hidden_out):
if k == 0:
# out hidden_layer 1
hidden_out[k] = activation_function((input_out.dot(w_i_h1)))
else:
hidden_out[k] = activation_function((hidden_out[k-1].dot(w_hi_hj[k-1])))
    # output of last layer (apply the activation, as in the training pass)
    output_out = activation_function(hidden_out[-1].dot(w_h_o))
    err = output_out - label
    print("Expected output => {0}, Real output => {1}".format(label, nearest_int(output_out)))
# https://mattmazur.com/2015/03/17/a-step-by-step-backpropagation-example/
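# Usage sketch (assuming a DATA.csv next to this script, as described above):
#   $ python Backprop.py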