forked from jhoward/Python-Neural-Network
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathnn.py
More file actions
252 lines (193 loc) · 6.94 KB
/
nn.py
File metadata and controls
252 lines (193 loc) · 6.94 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
"""
Pure Python implementation of a Back-Propagation Neural Network using the
hyperbolic tangent as the sigmoid squashing function.
Original Author: Neil Schemenauer <nas@arctrix.com>
Modified Author: James Howard <james.w.howard@gmail.com>
Modified to work for function regression and added option to use matplotlib
to display regression networks.
Code is placed in public domain.
"""
import math
import random
random.seed(0)
# calculate a random number where: a <= rand < b
def rand(a, b):
return (b-a)*random.random() + a
# Make a matrix (we could use NumPy to speed this up)
def makeMatrix(I, J, fill=0.0):
m = []
for i in range(I):
m.append([fill]*J)
return m
# our sigmoid function, tanh is a little nicer than the standard 1/(1+e^-x)
def sigmoid(x):
return math.tanh(x)
# derivative of our sigmoid function, in terms of the output (i.e. y)
def dsigmoid(y):
return 1.0 - y**2
def plot(inputs, outputs, actual):
"""Plot a given function.
The actual function will be plotted with a line and the outputs with
points. Useful for visualizing the error of the neural networks attempt
at function interpolation."""
try:
import matplotlib.pyplot
except:
raise ImportError, "matplotlib package not found."
fig = matplotlib.pyplot.figure()
ax1 = fig.add_subplot(111)
ax1.plot(inputs, actual, 'b-')
ax1.plot(inputs, outputs, 'r.')
matplotlib.pyplot.draw()
class NN:
def __init__(self, ni, nh, no, regression = False):
"""NN constructor.
ni, nh, no are the number of input, hidden and output nodes.
regression is used to determine if the Neural network will be trained
and used as a classifier or for function regression.
"""
self.regression = regression
#Number of input, hidden and output nodes.
self.ni = ni + 1 # +1 for bias node
self.nh = nh + 1 # +1 for bias node
self.no = no
# activations for nodes
self.ai = [1.0]*self.ni
self.ah = [1.0]*self.nh
self.ao = [1.0]*self.no
# create weights
self.wi = makeMatrix(self.ni, self.nh)
self.wo = makeMatrix(self.nh, self.no)
# set them to random vaules
for i in range(self.ni):
for j in range(self.nh):
self.wi[i][j] = rand(-1, 1)
for j in range(self.nh):
for k in range(self.no):
self.wo[j][k] = rand(-1, 1)
# last change in weights for momentum
self.ci = makeMatrix(self.ni, self.nh)
self.co = makeMatrix(self.nh, self.no)
def update(self, inputs):
if len(inputs) != self.ni-1:
raise ValueError, 'wrong number of inputs'
# input activations
for i in range(self.ni - 1):
self.ai[i] = inputs[i]
# hidden activations
for j in range(self.nh - 1):
total = 0.0
for i in range(self.ni):
total += self.ai[i] * self.wi[i][j]
self.ah[j] = sigmoid(total)
# output activations
for k in range(self.no):
total = 0.0
for j in range(self.nh):
total += self.ah[j] * self.wo[j][k]
self.ao[k] = total
if not self.regression:
self.ao[k] = sigmoid(total)
return self.ao[:]
def backPropagate(self, targets, N, M):
if len(targets) != self.no:
raise ValueError, 'wrong number of target values'
# calculate error terms for output
output_deltas = [0.0] * self.no
for k in range(self.no):
output_deltas[k] = targets[k] - self.ao[k]
if not self.regression:
output_deltas[k] = dsigmoid(self.ao[k]) * output_deltas[k]
# calculate error terms for hidden
hidden_deltas = [0.0] * self.nh
for j in range(self.nh):
error = 0.0
for k in range(self.no):
error += output_deltas[k]*self.wo[j][k]
hidden_deltas[j] = dsigmoid(self.ah[j]) * error
# update output weights
for j in range(self.nh):
for k in range(self.no):
change = output_deltas[k]*self.ah[j]
self.wo[j][k] = self.wo[j][k] + N*change + M*self.co[j][k]
self.co[j][k] = change
# update input weights
for i in range(self.ni):
for j in range(self.nh):
change = hidden_deltas[j]*self.ai[i]
self.wi[i][j] = self.wi[i][j] + N*change + M*self.ci[i][j]
self.ci[i][j] = change
# calculate error
error = 0.0
for k in range(len(targets)):
error += 0.5*((targets[k]-self.ao[k])**2)
return error
def test(self, patterns, verbose = False):
tmp = []
for p in patterns:
if verbose:
print p[0], '->', self.update(p[0])
tmp.append(self.update(p[0]))
return tmp
def weights(self):
print 'Input weights:'
for i in range(self.ni):
print self.wi[i]
print
print 'Output weights:'
for j in range(self.nh):
print self.wo[j]
def train(self, patterns, iterations=1000, N=0.5, M=0.1, verbose = False):
"""Train the neural network.
N is the learning rate.
M is the momentum factor.
"""
for i in xrange(iterations):
error = 0.0
for p in patterns:
self.update(p[0])
tmp = self.backPropagate(p[1], N, M)
error += tmp
if i % 100 == 0:
print 'error %-14f' % error
def demoRegression():
data = []
inputs = []
actual = []
domain = [-1, 1]
steps = 50
stepsize = (domain[1] - domain[0]) / ((steps - 1)*1.0)
#Teach the network the function y = x**2
for i in range(steps):
x = domain[0] + stepsize * i
y = x**2
data.append([[x], [y]])
inputs.append(x)
actual.append(y)
n = NN(1, 4, 1, regression = True)
#Train and test the nural network.
n.train(data, 1000, 0.2, 0.1, False)
outputs = n.test(data, verbose = True)
#Plot the function.
try:
plot(inputs, outputs, actual)
print "Press a key to quit."
value = raw_input()
except:
print "Must have matplotlib to plot."
def demoClassification():
# Teach network XOR function
pat = [
[[0,0], [0]],
[[0,1], [1]],
[[1,0], [1]],
[[1,1], [0]]
]
# create a network with two input, two hidden, and one output nodes
n = NN(2, 2, 1, regression = False)
# train it with some patterns then test it.
n.train(pat, 1000, 0.5, 0.2)
n.test(pat, verbose = True)
if __name__ == '__main__':
#demoRegression()
demoClassification()