machine-learning/Linear_regression/regression_example.py at master · adminho/machine-learning · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
from mpl_toolkits.mplot3d import Axes3D
from matplotlib import cm
import matplotlib.pyplot as plt
from matplotlib.ticker import LinearLocator, FormatStrFormatter

import numpy as np
import pandas as pd
from os.path import join

from sklearn import linear_model
from sklearn.metrics import mean_squared_error
from sklearn.preprocessing import StandardScaler
from sklearn.preprocessing import PolynomialFeatures
from sklearn import preprocessing
from sklearn.datasets import load_boston
from sklearn.metrics import r2_score

from scipy.stats import linregress
import tensorflow as tf

from keras.layers.core import Dense
from keras.optimizers import SGD
from keras.models import Sequential

import animation as am

def show_result(bias, weights, mse):
	print('Bias  = %s , Coefficients = %s , MSE = %s' % (bias, weights, mse))

def show_graph(X, Y, predict, title, xlabel, ylabel):
	plt.scatter(X, Y, color='b', label='data')
	plt.plot(X, predict, color='r', label='predict')
	plt.title(title)
	plt.xlabel('Years')
	plt.ylabel('Population')
	plt.show()

def add_one(data_X):
	ones =np.ones((len(data_X),1))
	# Add 1 vector to frist column
	X = np.append(ones, data_X, axis=1);
	# Wrap matrix to X, then you can use operators of the matrix
	X = np.matrix(X)
	return X

# example 1: solve eqation
def predict_example1(data_X, Y):
	X = add_one(data_X)
	C = (X.T * X).I * (X.T * Y) 			# Answer of coefficients
	#Finish training

	#Show model
	predict = X * C							# prediction
	mse = mean_squared_error(Y, predict )
	b, w = C[0], C[1:]
	show_result(b, w, mse)
	return predict

# example 2: use sklearn library
def predict_example2(X, Y):
	regr = linear_model.LinearRegression()
	regr.fit(X, Y)
	#Finish training

	#Show model
	predict = regr.predict(X)				# prediction
	mse = mean_squared_error(Y, predict)
	show_result(regr.intercept_, regr.coef_, mse)
	return predict


# example 3: use tensorflow library
def predict_example3(X, Y):
	# Try to find values for weights and bias that compute FX = W * X + B
	num_feature = X.shape[1]
	W = tf.Variable(tf.truncated_normal((num_feature, 1)))
	B = tf.Variable(tf.truncated_normal((1, 1)))
	X = X.astype(np.float32)
	FX =tf.matmul(X, W) + B

	# Minimize the mean squared errors.
	loss = tf.reduce_mean(tf.square(FX - Y))

	# Use gradient descent algorithm for optimizing
	learningRate = 0.01
	optimizer = tf.train.GradientDescentOptimizer(learningRate)
	train = optimizer.minimize(loss)

	# Before starting, initialize the variables. We will 'run' this first.
	init = tf.global_variables_initializer()

	# Launch the graph.
	sess = tf.Session()
	sess.run(init)

	# Try fit the line
	b, w, mse, predict = (None, None, None, None)
	for step in range(4000):
		_, b, w, mse, predict = sess.run([train, B, W, loss, FX])

	#Show model
	show_result(b, w ,mse )
	return predict

# Neural network
# example 4: use Keras library (1 neural)
def predict_example4(X, Y):
	model = Sequential()
	num_feature = X.shape[1]
	model.add(Dense(1, input_dim=num_feature, kernel_initializer='normal'))
	model.compile(loss='mean_squared_error', optimizer=SGD(lr=0.01))
	weights = model.layers[0].get_weights()
	model.fit(X, Y, epochs=4000, verbose=0)

	weights = model.layers[0].get_weights()
	w = weights[0]
	b = weights[1][0]

	#Show model
	predict = model.predict(X)				# prediction
	mse = mean_squared_error(Y, predict)
	show_result(b, w, mse)
	return predict

# example 5: use gradient descent algorithm (hard code without library)
def isConvergence(value):				# check condition of convergence
	return np.absolute(value) <= 0.005  	# set threshold

def isNan(value):
	if np.sum( np.isnan(value)) > 0 :
		return True

def plot_surface_error(data_X, Y): 		# for visualization
	x_range = np.arange(-5,15,1)		# -5< x-axis < 15 (increase 1 step)
	y_range = np.arange(-5,15,1)		# -5< y-axis < 15 (increase 1 step)

	w0, w1 = np.meshgrid(x_range, y_range)
	Z = np.empty(w0.shape) 	# same size as w0 and w1
	X = add_one(data_X)

	for i in x_range: 		# calculate mse of all (w0, w1) and save to Z
		for j in y_range:
			C = np.matrix( [w0[i, j] , w1[i, j]]).T
			fx = X * C
			Z[i,j] = mean_squared_error(Y, fx )

	fig = plt.figure()
	ax = fig.add_subplot(111, projection='3d')
	ax.set_xlabel('wo axis'); ax.set_ylabel('w1 axis'); ax.set_zlabel('MSE axis')
	surf = ax.plot_surface(w0, w1, Z, rstride=1, cstride=1, cmap=cm.coolwarm, linewidth=0, antialiased=False)
	# Customize the z axis.
	ax.zaxis.set_major_locator(LinearLocator(10))
	ax.zaxis.set_major_formatter(FormatStrFormatter('%.02f'))
	# Add a color bar which maps values to colors.
	fig.colorbar(surf, shrink=0.5, aspect=5)
	plt.show()

def predict_example5(data_X, Y):
	X = add_one(data_X)	                               # add one to first column
	learningRate = 0.0001				               # initial learning rate
	C = np.matrix(np.zeros(data_X.shape[1]+1)).T	   # initial coefficients
	assert C.shape == (data_X.shape[1]+1, 1)

	FX_List, Acc_List, Loss_List = [], [], [] 		# decrare empty list
	def evaluate():
		FX = X * C						# predict prices
		score = 100*r2_score(Y, FX) 		# calculate R2 score for accuracy
		MSE = mean_squared_error(Y, FX) # calculate mean squared error for loss
		#save it  for visualization later
		FX_List.append(FX)
		Acc_List.append(score)
		Loss_List.append(MSE)

	# for visualization before training
	evaluate()

	step = 0
	while(True):
		SLOPE = X.T * ( X * C - Y) 		# vector 2 x 1
		new_C = C - (learningRate * SLOPE)		# vector 2 x 1

		if isNan(SLOPE):
			print('Slope is NaN:', SLOPE)
			break

		w0, w1 = C[0,0], C[1,0]
		s0, s1 = SLOPE[0,0], SLOPE[1,0]

		C_update = np.copy(C)
		for i in range(0, len(SLOPE)):
			if isConvergence(SLOPE[i, 0]) == False: # not convergence
				C_update[i,0] = new_C[i,0]

		C = C_update		# update new coefficients include bias

		if step % 100 == 0: # for visualization later
			evaluate()
		step +=1

		# stop while_loop when all weights (coefficients) meet convergence condition
		conv = isConvergence(SLOPE)
		if np.sum(conv) == len(SLOPE):
			break

	#Finish training
	print("Total step to learning:", step)

	#Show model
	evaluate()
	b, w = C[0,0], C[1:,0]
	show_result(b, w, Loss_List[-1:])

	# For visualization finally
	FX_List = np.reshape(FX_List,(-1, X.shape[0]))
	return FX_List, Acc_List, Loss_List

########## For one input ###################
# example 6: use numpy module (polyfit)
def predict_example6(X, Y):
	X = X.reshape(-1)
	Y = Y.reshape(-1)
	w1, w0 = np.polyfit(X, Y, 1)
	#Finish training

	#Show model
	# use  broadcasting rules in numpy to add matrix
	predict = w1*X + [w0]					# prediction
	mse = mean_squared_error(Y, predict)
	show_result(w0, w1, mse)
	return predict

# example 7 : use scipy module(linregress)
def predict_example7(X, Y):
	X = X.reshape(1,-1)
	Y = Y.reshape(1,-1)
	slope, intercept, r, p, stderr = linregress(X, Y)
	#Show model
	predict = intercept + slope*X				# prediction
	mse = mean_squared_error(Y, predict)
	show_result(intercept, slope, mse)
	return predict

def prepare_dataset(csv_dataset,x_column_name, y_column_name, base_dir  = "" ):
	# read csv file with pandas module
	df = pd.read_csv(join(base_dir, csv_dataset))

	print("First of 5 row in Dataset")
	print(df.head())
	print("\nTail of 5 row in Dataset")
	print(df.tail())

	train_X = df[x_column_name].values.reshape(-1,1)		# X (Input) training set
	train_Y = df[y_column_name].values.reshape(-1,1)		# Y (Output) training set
	return train_X, train_Y

######################
#### for test only ####
def test_one_input(X, train_Y ,title, xlabel, ylabel):
	# Preprocessing data
	scaler_X = preprocessing.StandardScaler().fit(X)
	scaler_Y = preprocessing.StandardScaler().fit(train_Y)
	train_X = scaler_X.transform(X)
	train_Y = scaler_Y.transform(train_Y)
	#print(X__[0:5])
	#print(train_Y[0:5])

	assert train_X.shape == train_Y.shape

	print("\n+++++ Example 1++++")
	predict = predict_example1(train_X, train_Y)
	show_graph(X,
			scaler_Y.inverse_transform(train_Y),
			scaler_Y.inverse_transform(predict)
			,title, xlabel, ylabel)

	print("\n+++++ Example 2++++")
	predict = predict_example2(train_X, train_Y)

	print("\n+++++ Example 3++++")
	predict = predict_example3(train_X, train_Y)

	print("\n+++++ Example 4++++")
	predict = predict_example4(train_X, train_Y)

	print("\n+++++ Example 5++++")
	predictList, accuracyList, lossList = predict_example5(train_X, train_Y)
	am.visualize(X,
			scaler_Y.inverse_transform(train_Y),
			scaler_Y.inverse_transform(predictList),
			accuracyList, lossList, title=title)
	plot_surface_error(train_X, train_Y)

	print("\n+++++ Example 6++++")
	predict = predict_example6(train_X, train_Y)

	print("\n+++++ Example 7++++")
	predict = predict_example7(train_X, train_Y)

def test_polynomial(X, train_Y ,title, xlabel, ylabel):
	# Preprocessing data
	scaler_X = preprocessing.StandardScaler().fit(X)
	scaler_Y = preprocessing.StandardScaler().fit(train_Y)
	X__ = scaler_X.transform(X)
	train_Y = scaler_Y.transform(train_Y)
	#print(X__[0:5])
	#print(train_Y[0:5])

	# Generate polynomial features (2 degree).
	degree = 2 # You can change to degree 3, 4, 5 ant other at here
	poly = PolynomialFeatures(degree)
	# output for degree 2 = [1, x, x^2]
	# output for degree 3 = [1, x, x^2, x^3]
	train_X = poly.fit_transform(X__)
	#print(train_X[0:5])

	# remove 1 value from array (index 0)
	train_X = np.delete(train_X, [0], 1)
	#print(train_X[0:5])

	assert train_X.shape == (len(train_X), degree)  # (xxx, degree)
	assert train_Y.shape == (len(train_Y), 1) 		# (xxx, 1)

	print("\n+++++ Example 1++++")
	predict = predict_example1(train_X, train_Y)
	show_graph(X,
			scaler_Y.inverse_transform(train_Y),
			scaler_Y.inverse_transform(predict)
			,title, xlabel, ylabel)

	print("\n+++++ Example 2++++")
	predict = predict_example2(train_X, train_Y)

	print("\n+++++ Example 3++++")
	predict = predict_example3(train_X, train_Y)

	print("\n+++++ Example 4++++")
	predict = predict_example4(train_X, train_Y)

	print("\n+++++ Example 5++++")
	predictList, accuracyList, lossList = predict_example5(train_X, train_Y)
	am.visualize(X,
			scaler_Y.inverse_transform(train_Y),
			scaler_Y.inverse_transform(predictList),
			accuracyList, lossList, title=title)

def test_many_input(train_X, train_Y):
	scaler_X = preprocessing.StandardScaler().fit(train_X)
	scaler_Y = preprocessing.StandardScaler().fit(train_Y)
	train_X = scaler_X.transform(train_X)
	train_Y = scaler_Y.transform(train_Y)

	print("\n+++++ Example 1++++")
	predict = predict_example1(train_X, train_Y)

	print("\n+++++ Example 2++++")
	predict = predict_example2(train_X, train_Y)

	print("\n+++++ Example 3++++")
	predict = predict_example3(train_X, train_Y)

	print("\n+++++ Example 4++++")
	predict = predict_example4(train_X, train_Y)

if __name__ == '__main__':
	print("------- One input (one features) --------")
	print("++++++++ Example food truck ++++++++")
	# food_truck.csv is dataset from coursera:
	# https://www.coursera.org/learn/machine-learning teach by Andrew Ng
	X, train_Y = prepare_dataset('food_truck.csv'
									,x_column_name='population'
									,y_column_name='profit')
	test_one_input(X, train_Y, title='Food truck'
									,xlabel='Population', ylabel='Profit')
	print("\n++++++++ Example house price ++++++++")
	X, train_Y = prepare_dataset('example_price_house_40_headcolumn.csv'
									,x_column_name='area'
									,y_column_name='price')
	test_one_input(X, train_Y, title='House price'
									,xlabel='Area', ylabel='price')

	print("\n\n------- One input but many features (polynomial features) --------")
	print("++++++++ Example: Thailand population history ++++++++")
	X, train_Y = prepare_dataset('Thailand_population_history.csv'
									,x_column_name='Year'
									,y_column_name='Population')
	test_polynomial(X, train_Y, title='Thailand population'
									,xlabel='Years', ylabel='Population')

	print("\n++++++++ Example: Average income per month per household (B.E 41-58) ++++++++")
	X, train_Y = prepare_dataset('average_income_per_month_per_household_41-58.csv'
									,x_column_name='Years'
									,y_column_name='Average Monthly Income Per Household')
	test_polynomial(X, train_Y, title='Thailand monthly income'
									,xlabel='Years', ylabel='Average Monthly Income Per Household')

	print("\n\n----------- Many input ------------")
	print("++++++++++++ Example: Boston house-prices dataset +++++++++")
	boston = load_boston()
	train_X, train_Y = boston.data, boston.target
	train_Y = np.reshape(train_Y, (len(train_Y),1)) # shape: len(train_Y) x 1
	test_many_input(train_X, train_Y)