Commit 6b495fb
1 parent 36da624
Showing 2 changed files with 207 additions and 0 deletions.

@@ -0,0 +1,207 @@
import numpy as np
from numpy.linalg import norm
import matplotlib.pyplot as plt
import pandas as pd
import random as rd
plt.close('all')

'''IBM stock data'''
IBM = pd.read_csv('IBM_stock_close_price.csv')
ibm = np.array(IBM)
plt.figure(7)
plt.plot(ibm[:,1])
plt.title('IBM close price 1961~1962')
plt.xlabel('days')
plt.ylabel('close price')

Max = max(IBM.iloc[:,1])
Min = min(IBM.iloc[:,1])

# min-max normalization of the close price to [0, 1]
for i in range(ibm.shape[0]):
    ibm[i,1] = (ibm[i,1] - Min) / (Max - Min)

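# Note: predictions are later mapped back to the price scale with the inverse
# transform x = Min + x_norm * (Max - Min) (see RBFNN.predict below), so a
# normalized value of 0.0 corresponds to Min and 1.0 to Max.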
ibm_train = ibm[0:250,1]
ibm_test = ibm[250:,1]

'''initialized centers'''
Xmax = 1
Xmin = 0
hidden_neuron = 15  # number of hidden (RBF) neurons encoding a single input variable
center = []
for neuron in range(hidden_neuron):
    # place centers evenly on [Xmin, Xmax], offset half a cell from each edge
    center.append( Xmin + (Xmax - Xmin)/(2*hidden_neuron) + neuron*((Xmax - Xmin)/hidden_neuron) )
    center[neuron] = float('%.4f' % center[neuron])  # round to 4 decimal places
'''hidden_neuron evenly spaced RBF centers'''

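# The loop above builds the evenly spaced grid
#     c_j = Xmin + (Xmax - Xmin) * (2j + 1) / (2 * hidden_neuron),  j = 0 .. hidden_neuron-1
# e.g. with 15 neurons on [0, 1]: c_0 = 0.0333, c_1 = 0.1, ..., c_14 = 0.9667.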
print('Initial center =', center)
#dmax = (2*(hidden_neuron-1) - 1)/(2*hidden_neuron)
dmax = max(center) - min(center)
width = dmax/(2*hidden_neuron)**0.5  # common heuristic: sigma = d_max / sqrt(2M)
Width = width*np.ones((1,hidden_neuron))  # width array for optimization
beta = - 1 / (2 * (width ** 2))
delta = width*np.ones((hidden_neuron,1))

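# Each hidden neuron computes a Gaussian basis function of the distance to its
# center,
#     phi_j(x) = exp( -||x - c_j||^2 / (2 * sigma_j^2) ),
# so with beta = -1 / (2 * sigma^2) the activation can be written compactly as
# exp(beta * ||x - c_j||^2), which is the form used in train() below.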
class RBFNN:

    def __init__(self, n_input, n_hidden, w_in_hidden = None, w_out = None):
        self.n_input = n_input  # in practice the input size follows the sample features, so fixing it here is optional
        self.n_hidden = n_hidden
        self.w_in_hidden = w_in_hidden  # usually set to 1
        '''3 parameter sets are optimized during iteration, so they are kept as attributes'''
        self.w_out = w_out  # randomly initialized output weights
        self.center = center
        self.delta = delta
        self.output = []
        self.hidden_out = []

    def gaussian(self, x, Center):  # map one input sample to the hidden-layer activations
        '''input dimension = number of features'''
        encode_neuron = self.n_hidden
        # the widths come from the d_max heuristic above; there is no single theoretical choice
        hidden_out = np.zeros((encode_neuron, 1))  # (n_hidden, 1) matrix
        for j in range(encode_neuron):
            # note the parentheses: divide by 2*sigma^2, do not multiply by it
            hidden_out[j, 0] = np.exp(-self.Euclidean(x, Center[j]) ** 2 / (2 * self.delta[j] ** 2))

        return hidden_out  # activations of the hidden neurons

    def Euclidean(self, a, b):
        return norm(a - b)  # Euclidean distance between two vectors

    def HiddenLayer(self, x):
        centroid = self.center
        hidden_output = self.gaussian(x, centroid)  # hidden-neuron outputs for one input sample
        self.hidden_out = hidden_output
        return hidden_output  # (n_hidden, 1) matrix

    def feed_forward(self, x):  # forward pass from input to output layer, one sample at a time
        hidden_out = self.HiddenLayer(x)  # (n_hidden, 1) array
        weight = self.w_out  # (1, n_hidden) array
        output = np.dot(weight, hidden_out)
        return output  # output value for a single sample

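    # The network output is a weighted sum of the hidden activations,
    #     y(x) = sum_j w_j * phi_j(x),
    # i.e. a (1, n_hidden) weight row times an (n_hidden, 1) activation column.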
    def train(self, train_sample, sample_target):

        # Gradient-descent learning of three parameter sets: output weights,
        # centers, and widths. The updates are stored on self so they carry
        # over to the next iteration.
        lr = 0.2  # learning rate
        num_hidden = self.n_hidden

        samples = train_sample.shape[0]
        w_gradient = np.zeros((num_hidden, 1))
        c_gradient = np.zeros((num_hidden, 1))
        delta_gradient = np.zeros((num_hidden, 1))
        beta = np.zeros((num_hidden,1))
        Error = 0  # accumulated error over the batch

        for sample in range(samples):
            output = self.feed_forward(train_sample[sample,:])  # one output at a time
            Error += abs(output - sample_target[sample])  # absolute error, so terms do not cancel
            # Batch learning: accumulate the gradients over all samples

            for j in range(num_hidden):
                beta[j] = ( -1 / (2*(self.delta[j]**2)) )

                w_gradient[j] = w_gradient[j] + (output - sample_target[sample])*\
                    np.exp( beta[j] * (self.Euclidean(train_sample[sample,:], self.center[j]) ** 2) )
                # the center gradient needs the signed difference (x - c_j), not the norm
                c_gradient[j] = c_gradient[j] + (output - sample_target[sample])*self.w_out[0,j]*beta[j]*np.sum(train_sample[sample,:] - self.center[j]) \
                    *np.exp( beta[j] * (self.Euclidean(train_sample[sample,:], self.center[j]) ** 2) )
                delta_gradient[j] = delta_gradient[j] + (output - sample_target[sample])*(self.Euclidean(train_sample[sample,:],self.center[j])**2)\
                    *self.w_out[0,j]*( (self.delta[j])**(-3) )* \
                    np.exp(beta[j] * (self.Euclidean(train_sample[sample, :], self.center[j]) ** 2))
                # debug check left from development:
                # if self.delta[j] > 0 and delta_gradient[j] < 0:
                #     print('error =', output - sample_target[sample])

        # average the batch gradients and step down the error surface
        for i in range(num_hidden):
            self.w_out[0,i] += -lr*w_gradient[i]/samples
            self.center[i] += 2*lr*c_gradient[i]/samples
            self.delta[i] += -lr*delta_gradient[i]/samples

        #print('w_out =', self.w_out)
        #print('center =', self.center)
        #print('delta =', self.delta)

        return Error  # total absolute error on the normalized [0,1] scale

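    # For the batch error E = 1/2 * sum_n (y_n - t_n)^2, the accumulated
    # gradients above are, per hidden neuron j:
    #     dE/dw_j     = sum_n (y_n - t_n) * phi_j(x_n)
    #     dE/dc_j     = sum_n (y_n - t_n) * w_j * phi_j(x_n) * sum_i (x_ni - c_j) / sigma_j^2
    #     dE/dsigma_j = sum_n (y_n - t_n) * w_j * phi_j(x_n) * ||x_n - c_j||^2 / sigma_j^3
    # c_gradient stores -1/2 of dE/dc_j (via beta = -1/(2*sigma^2)), which is
    # why its update uses +2*lr while the other two use -lr.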
    def predict(self, test_data):
        # predict for one test sample
        estimate = self.feed_forward(test_data)
        # decode: map the normalized output back to the price scale
        estimate = Min + estimate * (Max - Min)
        return estimate

if __name__ == '__main__':

    Max = max(IBM.iloc[:,1])
    Min = min(IBM.iloc[:,1])
    # network parameters
    # use the close price as the prediction target
    slide_window = 3  # days of data used to predict one future value, i.e. the features
    duration = ibm_train.shape[0] - slide_window  # number of sliding windows over the training data
    #duration = 1
    input_neurons = slide_window  # number of features = number of input neurons
    hidden_neurons = 15
    weight = np.zeros((1,hidden_neurons))  # (1, hidden_neurons) weight matrix
    for j in range(hidden_neurons):
        weight[0,j] = rd.uniform(0,1)

    rbf = RBFNN(input_neurons, hidden_neurons, None, weight)  # build the RBF network architecture

    # create the training set as a sliding-window time series
    samples = duration
    train_set = np.zeros((duration,slide_window))
    target = np.zeros((samples,1))

    for sample in range(samples):
        train_set[sample,:] = ibm_train[sample:(sample + slide_window)]
        target[sample] = ibm_train[sample + slide_window]

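    # Example of the window-to-target mapping (values are illustrative):
    #     train_set[0, :] = [p_0, p_1, p_2]  ->  target[0] = p_3
    #     train_set[1, :] = [p_1, p_2, p_3]  ->  target[1] = p_4
    # where p_t is the normalized close price on day t.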
    Iteration = 100
    Performance = np.zeros((Iteration,1))
    Predict = np.zeros((Iteration,1))
    for iterate in range(Iteration):
        # batch learning: one call to train() runs a full pass over the set
        error = rbf.train(train_set, target)  # total absolute error
        E = error * (Max - Min) / samples  # mean error per sample, on the price scale
        print('Error in epoch: ', E)
        Performance[iterate] = E
        Predict[iterate] = rbf.predict(train_set[0, :])

    #print(Performance)
    plt.figure()
    plt.title('Error Performance')
    plt.plot(Performance)

    # training set performance
    check = np.zeros((train_set.shape[0], 1))
    for i in range(train_set.shape[0]):
        check[i] = rbf.predict(train_set[i,:])
        target[i] = Min + (Max - Min)*target[i]  # denormalize the target for comparison

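    # Visualize the training-set fit: denormalized predictions in `check`
    # against the denormalized targets (mirrors the test plot below).
    plt.figure()
    plt.title('training performance')
    plt.plot(target, 'r-', label='Real output')
    plt.plot(check, 'b-', label='Predict output')
    plt.legend(loc='upper right')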
    # test set performance
    test_duration = ibm_test.shape[0] - slide_window
    test_set = np.zeros((test_duration,slide_window))
    for sample in range(test_set.shape[0]):
        test_set[sample,:] = ibm_test[sample:sample + slide_window]
    test_target = ibm_test[slide_window:].copy()  # copy so denormalizing does not modify ibm_test
    test_out = np.zeros((test_set.shape[0], 1))
    for i in range(test_set.shape[0]):
        test_out[i] = rbf.predict(test_set[i, :])
        test_target[i] = Min + (Max - Min) * test_target[i]

    plt.figure()
    plt.title('test performance')
    plt.plot(test_target, 'r-', label='Real output')
    plt.plot(test_out, 'b-', label='Predict output')
    plt.legend(loc='upper right')

    plt.show()