From b6ef93b7bd39a4e8b13ea73959347e2374505691 Mon Sep 17 00:00:00 2001
From: eriklindernoren
Date: Wed, 4 Oct 2017 14:18:57 +0200
Subject: [PATCH] Cleanup

---
 mlfromscratch/examples/neuroevolution.py            |  5 +++++
 mlfromscratch/examples/random_forest.py             |  4 ++--
 mlfromscratch/supervised_learning/decision_tree.py  | 11 ++++-------
 .../supervised_learning/gradient_boosting.py        |  8 +++-----
 .../supervised_learning/k_nearest_neighbors.py      |  4 ++--
 .../supervised_learning/multilayer_perceptron.py    |  2 --
 mlfromscratch/supervised_learning/neuroevolution.py | 12 ++++--------
 mlfromscratch/supervised_learning/perceptron.py     |  6 ++++--
 mlfromscratch/supervised_learning/random_forest.py  |  9 ++++-----
 mlfromscratch/supervised_learning/regression.py     |  3 ---
 .../principal_component_analysis.py                 |  9 +++------
 11 files changed, 31 insertions(+), 42 deletions(-)

diff --git a/mlfromscratch/examples/neuroevolution.py b/mlfromscratch/examples/neuroevolution.py
index 09f57d25..505782a7 100644
--- a/mlfromscratch/examples/neuroevolution.py
+++ b/mlfromscratch/examples/neuroevolution.py
@@ -24,8 +24,13 @@ def model_builder(n_inputs, n_outputs):
         model.add(Activation('relu'))
         model.add(Dense(n_outputs))
         model.add(Activation('softmax'))
+
         return model
 
+    # Print the model summary of a individual in the population
+    print ()
+    model_builder(n_inputs=X.shape[1], n_outputs=y.shape[1]).summary()
+
     X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.4)
 
     model = Neuroevolution(population_size=100,
diff --git a/mlfromscratch/examples/random_forest.py b/mlfromscratch/examples/random_forest.py
index 36d306df..38f6a816 100644
--- a/mlfromscratch/examples/random_forest.py
+++ b/mlfromscratch/examples/random_forest.py
@@ -5,13 +5,13 @@
 from mlfromscratch.supervised_learning import RandomForest
 
 def main():
-    data = datasets.load_iris()
+    data = datasets.load_digits()
     X = data.data
     y = data.target
 
     X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.4, seed=2)
 
-    clf = RandomForest()
+    clf = RandomForest(n_estimators=100)
     clf.fit(X_train, y_train)
 
     y_pred = clf.predict(X_test)
diff --git a/mlfromscratch/supervised_learning/decision_tree.py b/mlfromscratch/supervised_learning/decision_tree.py
index 2f548fe9..2d896339 100644
--- a/mlfromscratch/supervised_learning/decision_tree.py
+++ b/mlfromscratch/supervised_learning/decision_tree.py
@@ -3,9 +3,6 @@
 
 from mlfromscratch.utils import divide_on_feature, train_test_split, standardize, mean_squared_error
 from mlfromscratch.utils import calculate_entropy, accuracy_score, calculate_variance
-from mlfromscratch.unsupervised_learning import PCA
-from mlfromscratch.utils import Plot
-
 
 class DecisionNode():
     """Class that represents a decision node or leaf in the decision tree
@@ -118,10 +115,10 @@ def _build_tree(self, X, y, current_depth=0):
                         largest_impurity = impurity
                         best_criteria = {"feature_i": feature_i, "threshold": threshold}
                         best_sets = {
-                            "leftX": Xy1[:, :n_features],
-                            "lefty": Xy1[:, n_features:],
-                            "rightX": Xy2[:, :n_features],
-                            "righty": Xy2[:, n_features:]
+                            "leftX": Xy1[:, :n_features],   # X of left subtree
+                            "lefty": Xy1[:, n_features:],   # y of left subtree
+                            "rightX": Xy2[:, :n_features],  # X of right subtree
+                            "righty": Xy2[:, n_features:]   # y of right subtree
                             }
 
         if largest_impurity > self.min_impurity:
diff --git a/mlfromscratch/supervised_learning/gradient_boosting.py b/mlfromscratch/supervised_learning/gradient_boosting.py
index 9b84f99c..c2c43a84 100644
--- a/mlfromscratch/supervised_learning/gradient_boosting.py
+++ b/mlfromscratch/supervised_learning/gradient_boosting.py
@@ -59,12 +59,10 @@ def __init__(self, n_estimators, learning_rate, min_samples_split,
 
     def fit(self, X, y):
         y_pred = np.full(np.shape(y), np.mean(y, axis=0))
-
         for i in self.bar(range(self.n_estimators)):
-            tree = self.trees[i]
             gradient = self.loss.gradient(y, y_pred)
-            tree.fit(X, gradient)
-            update = tree.predict(X)
+            self.trees[i].fit(X, gradient)
+            update = self.trees[i].predict(X)
 
             # Update y prediction
             y_pred -= np.multiply(self.learning_rate, update)
@@ -72,7 +70,7 @@ def fit(self, X, y):
     def predict(self, X):
         y_pred = np.array([])
         # Make predictions
-        for i, tree in enumerate(self.trees):
+        for tree in self.trees:
             update = tree.predict(X)
             update = np.multiply(self.learning_rate, update)
             y_pred = -update if not y_pred.any() else y_pred - update
diff --git a/mlfromscratch/supervised_learning/k_nearest_neighbors.py b/mlfromscratch/supervised_learning/k_nearest_neighbors.py
index dff224d1..f9c4b488 100644
--- a/mlfromscratch/supervised_learning/k_nearest_neighbors.py
+++ b/mlfromscratch/supervised_learning/k_nearest_neighbors.py
@@ -16,7 +16,7 @@ def __init__(self, k=5):
         self.k = k
 
     def _vote(self, neighbors):
-        """ Return the most common label among the neighbors """
+        """ Return the most common class among the neighbor samples """
         counts = np.bincount(neighbors[:, 1].astype('int'))
         return counts.argmax()
 
@@ -36,7 +36,7 @@ def predict(self, X_test, X_train, y_train):
             # Sort the list of observed samples from lowest to highest distance
             # and select the k first
             k_nearest_neighbors = neighbors[neighbors[:, 0].argsort()][:self.k]
-            # Get the most common label among the neighbors
+            # Get the most common class among the neighbors
             label = self._vote(k_nearest_neighbors)
             y_pred[i] = label
         return y_pred
diff --git a/mlfromscratch/supervised_learning/multilayer_perceptron.py b/mlfromscratch/supervised_learning/multilayer_perceptron.py
index e49ad1f1..6f42c6af 100644
--- a/mlfromscratch/supervised_learning/multilayer_perceptron.py
+++ b/mlfromscratch/supervised_learning/multilayer_perceptron.py
@@ -82,10 +82,8 @@ def fit(self, X, y):
     # Use the trained model to predict labels of X
     def predict(self, X):
         # Forward pass:
-        # Calculate hidden layer
         hidden_input = X.dot(self.W) + self.w0
         hidden_output = self.hidden_activation(hidden_input)
-        # Calculate output layer
         output_layer_input = hidden_output.dot(self.V) + self.v0
         y_pred = self.output_activation(output_layer_input)
         return y_pred
diff --git a/mlfromscratch/supervised_learning/neuroevolution.py b/mlfromscratch/supervised_learning/neuroevolution.py
index 2985328c..57bdd69d 100644
--- a/mlfromscratch/supervised_learning/neuroevolution.py
+++ b/mlfromscratch/supervised_learning/neuroevolution.py
@@ -2,8 +2,6 @@
 import numpy as np
 import copy
 
-from mlfromscratch.utils.misc import bar_widgets
-
 class Neuroevolution():
     """ Evolutionary optimization of Neural Networks.
 
@@ -78,7 +76,7 @@ def _crossover(self, parent1, parent2):
 
     def _calculate_fitness(self):
         """ Evaluate the NNs on the test set to get fitness scores """
-        for i, individual in enumerate(self.population):
+        for individual in self.population:
             loss, acc = individual.test_on_batch(self.X, self.y)
             individual.fitness = 1 / (loss + 1e-8)
             individual.accuracy = acc
@@ -89,12 +87,10 @@ def evolve(self, X, y, n_generations):
 
         self._initialize_population()
 
-        # Print the model summary of the population's individuals
-        print ()
-        self.population[0].summary()
-
         # The 40% highest fittest individuals will be selected for the next generation
         n_winners = int(self.population_size * 0.4)
+        # The fittest 60% of the population will be selected as parents to form offspring
+        n_parents = self.population_size - n_winners
 
         for epoch in range(n_generations):
             # Determine the fitness of the individuals in the population
@@ -113,7 +109,7 @@ def evolve(self, X, y, n_generations):
             next_population = [self.population[i] for i in range(n_winners)]
 
             # The fittest 60% of the population are selected as parents
-            parents = [self.population[i] for i in range(self.population_size - n_winners)]
+            parents = [self.population[i] for i in range(n_parents)]
             for i in np.arange(0, len(parents), 2):
                 # Perform crossover to produce offspring
                 child1, child2 = self._crossover(parents[i], parents[i+1])
diff --git a/mlfromscratch/supervised_learning/perceptron.py b/mlfromscratch/supervised_learning/perceptron.py
index 1fcdca02..dfedf171 100644
--- a/mlfromscratch/supervised_learning/perceptron.py
+++ b/mlfromscratch/supervised_learning/perceptron.py
@@ -7,7 +7,8 @@
 from mlfromscratch.deep_learning.activation_functions import Sigmoid, ReLU, SoftPlus, LeakyReLU, TanH, ELU
 from mlfromscratch.deep_learning.loss_functions import CrossEntropy, SquareLoss
 from mlfromscratch.utils import Plot
-
+from mlfromscratch.utils.misc import bar_widgets
+import progressbar
 
 class Perceptron():
     """The Perceptron. One layer neural network classifier.
@@ -30,6 +31,7 @@ def __init__(self, n_iterations=20000, activation_function=Sigmoid, loss=SquareL
         self.learning_rate = learning_rate
         self.loss = loss()
         self.activation_func = activation_function()
+        self.progressbar = progressbar.ProgressBar(widgets=bar_widgets)
 
     def fit(self, X, y):
         n_samples, n_features = np.shape(X)
@@ -40,7 +42,7 @@ def fit(self, X, y):
         self.W = np.random.uniform(-limit, limit, (n_features, n_outputs))
         self.w0 = np.zeros((1, n_outputs))
 
-        for i in range(self.n_iterations):
+        for i in self.progressbar(range(self.n_iterations)):
             # Calculate outputs
             linear_output = X.dot(self.W) + self.w0
             y_pred = self.activation_func(linear_output)
diff --git a/mlfromscratch/supervised_learning/random_forest.py b/mlfromscratch/supervised_learning/random_forest.py
index b84fabfc..b77e45c3 100644
--- a/mlfromscratch/supervised_learning/random_forest.py
+++ b/mlfromscratch/supervised_learning/random_forest.py
@@ -31,10 +31,9 @@ class RandomForest():
         The maximum depth of a tree.
     """
     def __init__(self, n_estimators=100, max_features=None, min_samples_split=2,
-                 min_gain=1e-7, max_depth=float("inf")):
+                 min_gain=0, max_depth=float("inf")):
         self.n_estimators = n_estimators            # Number of trees
         self.max_features = max_features            # Maxmimum number of features per tree
-        self.feature_indices = []                   # The indices of the features used for each tree
         self.min_samples_split = min_samples_split
         self.min_gain = min_gain                    # Minimum information gain req. to continue
         self.max_depth = max_depth                  # Maximum depth for tree
@@ -64,7 +63,7 @@ def fit(self, X, y):
             # Feature bagging (select random subsets of the features)
             idx = np.random.choice(range(n_features), size=self.max_features, replace=True)
             # Save the indices of the features for prediction
-            self.feature_indices.append(idx)
+            self.trees[i].feature_indices = idx
             # Choose the features corresponding to the indices
             X_subset = X_subset[:, idx]
             # Fit the tree to the data
@@ -74,8 +73,8 @@ def predict(self, X):
         y_preds = np.empty((X.shape[0], len(self.trees)))
         # Let each tree make a prediction on the data
         for i, tree in enumerate(self.trees):
-            # Select the features that the tree has trained on
-            idx = self.feature_indices[i]
+            # Indices of the features that the tree has trained on
+            idx = tree.feature_indices
             # Make a prediction based on those features
             prediction = tree.predict(X[:, idx])
             y_preds[:, i] = prediction
diff --git a/mlfromscratch/supervised_learning/regression.py b/mlfromscratch/supervised_learning/regression.py
index e20e0077..beb0b5ae 100644
--- a/mlfromscratch/supervised_learning/regression.py
+++ b/mlfromscratch/supervised_learning/regression.py
@@ -133,7 +133,6 @@ class LassoRegression(Regression):
     """
     def __init__(self, degree, reg_factor, n_iterations=3000, learning_rate=0.01):
         self.degree = degree
-        # Lasso Regression
         self.regularization = l1_regularization(alpha=reg_factor)
         super(LassoRegression, self).__init__(n_iterations, learning_rate)
 
@@ -189,7 +188,6 @@ class RidgeRegression(Regression):
         The step length that will be used when updating the weights.
     """
     def __init__(self, reg_factor, n_iterations=1000, learning_rate=0.001):
-        # Ridge Regression
         self.regularization = l2_regularization(alpha=reg_factor)
         super(RidgeRegression, self).__init__(n_iterations, learning_rate)
 
@@ -211,7 +209,6 @@ class PolynomialRidgeRegression(Regression):
     """
    def __init__(self, degree, reg_factor, n_iterations=3000, learning_rate=0.01, gradient_descent=True):
         self.degree = degree
-        # Ridge Regression
         self.regularization = l2_regularization(alpha=reg_factor)
         super(PolynomialRidgeRegression, self).__init__(n_iterations, learning_rate)
 
diff --git a/mlfromscratch/unsupervised_learning/principal_component_analysis.py b/mlfromscratch/unsupervised_learning/principal_component_analysis.py
index cd54c5af..92e554d4 100644
--- a/mlfromscratch/unsupervised_learning/principal_component_analysis.py
+++ b/mlfromscratch/unsupervised_learning/principal_component_analysis.py
@@ -10,16 +10,13 @@ class PCA():
     maximizing the variance along each feature axis. This class is also used
     throughout the project to plot data.
     """
-    def __init__(self): pass
-
     def transform(self, X, n_components):
         """ Fit the dataset to the number of principal components specified in the
         constructor and return the transformed dataset """
-        covariance = calculate_covariance_matrix(X)
+        covariance_matrix = calculate_covariance_matrix(X)
 
-        # Get the eigenvalues and eigenvectors.
-        # (eigenvector[:,0] corresponds to eigenvalue[0])
-        eigenvalues, eigenvectors = np.linalg.eig(covariance)
+        # Where (eigenvector[:,0] corresponds to eigenvalue[0])
+        eigenvalues, eigenvectors = np.linalg.eig(covariance_matrix)
 
         # Sort the eigenvalues and corresponding eigenvectors from largest
         # to smallest eigenvalue and select the first n_components