
Commit

implementation with testing (finished) - Albi
albiboni committed Oct 26, 2017
1 parent 4a82e08 commit 4463b07
Showing 4 changed files with 153 additions and 108 deletions.
261 changes: 153 additions & 108 deletions src/ML_Methods.py
@@ -4,167 +4,212 @@
import pickle  # used by the test loaders below (assumption: not already imported in the file's unshown first lines)
import datetime
import numpy as np

"""Functions."""

def check_input(y, tx, lambda_ = 0, initial_w = 0, max_iters = 0, gamma = 0):
"""check that all types are correct takes 4 times more"""
w = initial_w.astype(float)
y = y.astype(float)
tx = tx.astype(float)
max_iters = int(max_iters)
gamma = float(gamma)
lambda_ = float(lambda_)
return y, tx, lambda_, initial_w, max_iters, gamma
"""Functions"""

def check_input(y, tx, lambda_=0, initial_w=np.array([0, 0]), max_iters=0, gamma=0):
    """check that all inputs have the correct type (the conversions cost extra time)"""
    y_check = y.astype(float)
    tx_check = tx.astype(float)
    lambda_check = float(lambda_)
    w_check = initial_w.astype(float)
    max_iters_check = int(max_iters)
    gamma_check = float(gamma)
    return y_check, tx_check, lambda_check, w_check, max_iters_check, gamma_check
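# Note: the default initial_w=np.array([0, 0]) is evaluated once, at definition
# time. That is harmless here because astype() returns a copy, but it is the
# classic Python pitfall if a mutable default ever gets modified in place.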

def compute_loss_MSE(y, tx, w):
"""calculate loss using mean squared error"""
e = y - tx @ w
    loss = 1 / (2 * np.shape(tx)[0]) * e.T @ e
return loss
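# Sanity check (a minimal sketch with hypothetical toy arrays): a weight vector
# that reproduces y exactly should give zero loss.
#   y_demo = np.array([1.0, 2.0]); tx_demo = np.array([[1.0, 0.0], [1.0, 1.0]])
#   compute_loss_MSE(y_demo, tx_demo, np.array([1.0, 1.0]))  # -> 0.0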
def compute_loss_logistic_regression(y, tx, w):
"""calculate loss for logistic regression"""
sigmoid = 1 / (1 + np.exp(-(tx @ w)))
loss = -1 / np.shape(tx)[0] * np.sum((1 - y) * np.log(1 - sigmoid) + y * np.log(sigmoid))
return loss
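# This is the negative log-likelihood (cross-entropy) averaged over the N rows
# of tx, assuming labels y in {0, 1}. If |tx @ w| grows large, the sigmoid
# saturates to exactly 0.0 or 1.0 in floating point and np.log returns -inf,
# so watch for inf/nan losses with aggressive step sizes.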
def check_early_convergence(loss_previous, loss_now, n_iter, threshold=1e-8):
    """check for convergence and print the iteration at which it occurs"""
    if np.abs(loss_now - loss_previous) < threshold:
        print('convergence reached at iteration ' + str(n_iter - 1) + ', try setting max_iters to ' + str(n_iter))
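# Note: this helper only *reports* convergence; it does not stop the caller's
# loop. The callers below keep iterating until max_iters, so the printed hint
# ('try setting max_iters to ...') is how you shorten future runs.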

def shuffle_dataset(y, tx):
    """shuffle the dataset"""
    # np.random.seed(1)  # if left commented out, a different seed is used on every run
    random_shuffle = np.random.permutation(np.arange(np.shape(tx)[0]))
    shuffled_y = y[random_shuffle]
    shuffled_tx = tx[random_shuffle]
    return shuffled_y, shuffled_tx
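# Usage sketch (hypothetical arrays): the same permutation indexes y and tx,
# so the shuffled rows stay aligned.
#   y_s, tx_s = shuffle_dataset(np.array([0., 1.]), np.array([[1., 2.], [3., 4.]]))
#   # y_s[i] still labels tx_s[i] for every i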

def least_squares_GD(y, tx, initial_w, max_iters, gamma):
"""Computes least squares using Gradient Descent"""
    y, tx, lambda_, w, max_iters, gamma = check_input(y, tx, initial_w=initial_w,
                                                      max_iters=max_iters, gamma=gamma)
loss = 0

for n_iter in range(max_iters):
e = y - tx @ w
gradient = -1 / np.shape(tx)[0] * tx.T @ e
w = w - gamma * gradient
loss_now = compute_loss_MSE(y, tx, w)
check_early_convergence(loss, loss_now, n_iter)
loss = loss_now

return w, loss
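# Usage sketch (assumes tx.shape[1] == len(initial_w), as in the tests below):
#   w, loss = least_squares_GD(y, tx, np.array([0, 0]), 50, 0.7)
# Each iteration takes a full-batch step against the gradient of the MSE loss,
# which is -1/N * tx.T @ e.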


def least_squares_SGD(y, tx, initial_w, max_iters, gamma):
"""Computes least squares using Stochastic Gradient Descent"""
y, tx, lambda_, w, max_iters, gamma = check_input(y, tx, initial_w=initial_w,
max_iters=max_iters, gamma=gamma)
shuffled_y, shuffled_tx = shuffle_dataset(y, tx)
loss = 0

for n_iter in range(max_iters):

for training_example in range(np.shape(tx)[0]):
            e = shuffled_y[training_example] - shuffled_tx[training_example] @ w
gradient = -e * shuffled_tx[training_example]
w = w - gamma * gradient
loss_now = compute_loss_MSE(shuffled_y, shuffled_tx, w)
check_early_convergence(loss, loss_now, n_iter)
loss = loss_now

return w, loss
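# Note: each n_iter above is a full epoch; the inner loop visits every training
# example once and updates w with the single-sample gradient -e * x_i. With
# max_iters=1 (as in the test below) that is one pass over the shuffled data.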


def least_squares(y, tx):
"""Computes least squares using Normal equations"""
y, tx, lambda_, w, max_iters, gamma = check_input(y, tx)
w = np.linalg.inv(tx.T @ tx) @ tx.T @ y
loss = compute_loss_MSE(y, tx, w)
return w, loss
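# Design note: inverting tx.T @ tx explicitly is fine for small, well-conditioned
# problems like the tests below, but np.linalg.solve(tx.T @ tx, tx.T @ y) (or
# np.linalg.lstsq) is the numerically safer way to solve the normal equations.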


def ridge_regression(y, tx, lambda_ ):
"""Computes ridge regression using normal equations"""
y, tx, lambda_, w, max_iters, gamma = check_input(y, tx, lambda_=lambda_)
w = np.linalg.inv(tx.T @ tx + lambda_ * 2 * np.shape(y)[0] * np.eye(np.shape(tx)[1])) @ tx.T @ y
loss = compute_loss_MSE(y, tx, w) + lambda_ * w.T @ w
return w, loss
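# The closed form solves (tx.T @ tx + 2*N*lambda_ * I) w = tx.T @ y, i.e. the
# normal equations of the L2-penalized cost; the reported loss adds the penalty
# lambda_ * w.T @ w on top of the plain MSE.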


def logistic_regression(y, tx, initial_w, max_iters, gamma):
"""Computes logistic regression using gradient descent"""
y, tx, lambda_, w, max_iters, gamma = check_input(y, tx, initial_w=initial_w,
max_iters=max_iters, gamma=gamma)
loss = 0

    for n_iter in range(max_iters):
        sigmoid = 1 / (1 + np.exp(-(tx @ w)))
        gradient = -1 / np.shape(tx)[0] * tx.T @ (y - sigmoid)
        w = w - gamma * gradient
loss_now = compute_loss_logistic_regression(y, tx, w)
check_early_convergence(loss, loss_now, n_iter)
loss = loss_now

return w, loss
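# Usage sketch (assumes y is a column vector of 0/1 labels with one row per
# row of tx, matching the test below):
#   w, loss = logistic_regression(y, tx, np.zeros((tx.shape[1], 1)), 1846, 1)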


def reg_logistic_regression(y, tx, lambda_ , initial_w, max_iters, gamma):
"""Computes regularized logistic regression using gradient descent"""
    y, tx, lambda_, w, max_iters, gamma = check_input(y, tx, lambda_=lambda_, initial_w=initial_w,
max_iters=max_iters, gamma=gamma)
loss = 0

for n_iter in range(max_iters):
sigmoid = 1 / (1 + np.exp(-(tx @ w)))
gradient = -1 / np.shape(tx)[0] * tx.T @ (y - sigmoid) + 2 * lambda_ * w
w = w - gamma * gradient

loss_now = compute_loss_logistic_regression(y, tx, w) + lambda_ * w.T @ w
check_early_convergence(loss, loss_now, n_iter)
loss = loss_now

return w, loss
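# Note the asymmetry: the gradient adds the penalty gradient 2 * lambda_ * w,
# while the reported loss adds lambda_ * w.T @ w itself. With lambda_ = 0 this
# reduces exactly to logistic_regression above (cf. the test below).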




"""Testing"""

loop = True

while loop:
    input_user = input('Test:\n 1 Least squares \n 2 Logistic regression \n 3 end \n ')

if int(input_user) == 1:
"""load data for least squares"""
with open(r"test_ML_methods/data.pickle", "rb") as input_file:
data = pickle.load(input_file)
y = data[0]
tx = data[1]
test = input('ML Methods\n 1 least_squares_GD \n 2 least_squares_SGD \n 3 least_squares(Normal Equation) \n'
' 4 ridge_regression(Normal Equation) \n ')

if int(test) == 1:
"""run least_squares_GD"""
start_time = datetime.datetime.now()
function = least_squares_GD(y, tx, np.array([0, 0]), 12, 0.7)
            print('weights = ', function[0], 'loss = ', function[1])
            end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("Gradient Descent: execution time={t:.3f} seconds".format(t=execution_time))

elif int(test) == 2:
"""run least_squares_SGD"""
start_time = datetime.datetime.now()
function = least_squares_SGD(y, tx, np.array([0, 0]), 1, 0.01)
print('weights = ', function[0], 'loss = ', function[1])
end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("Stochastic Gradient Descent: execution time={t:.3f} seconds".format(t=execution_time))

elif int(test) == 3:
"""run least_squares(Normal Equation)"""
start_time = datetime.datetime.now()
function = least_squares(y, tx)
print('weights = ', function[0], 'loss = ', function[1])
end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("Normal equation least squares: execution time={t:.3f} seconds".format(t=execution_time))

elif int(test) == 4:
"""run ridge_regression(Normal Equation)"""
start_time = datetime.datetime.now()
function = ridge_regression(y, tx, 0.0001)
print('weights = ', function[0], 'loss = ', function[1])
end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("Regularized Normal equation least squares: execution time={t:.3f} seconds".format(t=execution_time))

else:
loop = False


elif int(input_user) == 2:
"""load data for logistic regression"""
with open(r"test_ML_methods/tx_regression.pickle", "rb") as input_file:
tx = pickle.load(input_file)
with open(r"test_ML_methods/y_regression.pickle", "rb") as input_file:
y = pickle.load(input_file)
test = input('ML Methods\n 1 logistic_regression(Gradient Descent) \n 2 reg_logistic_regression(Gradient Descent) \n ')

if int(test) == 1:
"""run logistic_regression"""
start_time = datetime.datetime.now()
function = logistic_regression(y, tx, np.zeros((tx.shape[1], 1)), 1846, 1)
print('weights = ', function[0], 'loss = ', function[1])
end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("logistic regression: execution time={t:.3f} seconds".format(t=execution_time))

elif int(test) == 2:
"""run ridge_regression(Normal Equation)"""
start_time = datetime.datetime.now()
function = reg_logistic_regression(y, tx, 0, np.zeros((tx.shape[1], 1)), 1846, 1)
print('weights = ', function[0], 'loss = ', function[1])
end_time = datetime.datetime.now()
            execution_time = (end_time - start_time).total_seconds()
            print("regularized logistic regression: execution time={t:.3f} seconds".format(t=execution_time))

elif int(input_user) == 3:
loop = False

else:
loop = False
File renamed without changes.
File renamed without changes.
File renamed without changes.
