Merge pull request #2531 from taneemishere/Taneem_Jan
Moves all machine learning algorithms to the machine_learning directory and adds an SVM implementation in Python.
Showing 93 changed files with 167 additions and 119 deletions.
36 files renamed without changes.
@@ -0,0 +1,8 @@
# Support Vector Machine

The Support Vector Machine (SVM) is a supervised machine learning algorithm used for both classification and regression problems. For classification, the data points are separated by drawing an optimal hyperplane. But how is a hyperplane determined to be the optimal one? The algorithm identifies the support vectors, the data points of each category that lie closest to the decision boundary, and the hyperplane that leaves the widest margin between the support vectors of the categories is considered optimal.
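To make "the widest margin" precise, here is the standard hard-margin formulation as textbook background (not part of this commit). For training points $x_i$ with labels $y_i \in \{-1, +1\}$, the optimal hyperplane $w \cdot x + b = 0$ solves

$$\min_{w,\,b} \ \frac{1}{2}\lVert w \rVert^2 \quad \text{subject to} \quad y_i\,(w \cdot x_i + b) \ge 1 \ \text{for all } i.$$

The distance between the two supporting hyperplanes $w \cdot x + b = \pm 1$ is $2/\lVert w \rVert$, so minimizing $\lVert w \rVert$ maximizes the margin, and the points that satisfy the constraint with equality are the support vectors. The soft-margin variant adds slack terms weighted by a parameter C, which is the C passed to sklearn's SVC in the script below.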
40 changes: 40 additions & 0 deletions in machine_learning/Support_Vector_Machine/Python/SVM_with_Sklearn.py
@@ -0,0 +1,40 @@
# some imports
from sklearn import datasets
from sklearn.model_selection import train_test_split
from sklearn import svm
from sklearn import metrics

# Load the breast cancer dataset bundled with sklearn
cancer = datasets.load_breast_cancer()

# See the feature and label names of the dataset
print("Features are: ", cancer.feature_names)
print("Labels are: ", cancer.target_names)

# Assign the features to X and the labels to y
X = cancer.data
y = cancer.target

# Split the dataset into 80% training and 20% testing
x_train, x_test, y_train, y_test = train_test_split(X, y, test_size=0.2)

# print(x_train, y_train)

# These are the two classes of the label
classes = ['malignant', 'benign']

# Support Vector Classifier of the Support Vector Machine
# C is the regularization parameter that controls how soft the margin is
clf = svm.SVC(kernel="linear", C=2)
clf.fit(x_train, y_train)

# Predict the labels of the test features
y_pred = clf.predict(x_test)

# Compute the accuracy score of the model
acc = metrics.accuracy_score(y_test, y_pred)

print("Accuracy of SVC: ", acc)
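The kernel="linear" and C=2 above are fixed choices; a natural next step is to search over them with cross-validation. A minimal sketch, not part of this commit, assuming the same breast cancer dataset and sklearn's GridSearchCV (the grid values are illustrative):

from sklearn import datasets, svm
from sklearn.model_selection import GridSearchCV, train_test_split

cancer = datasets.load_breast_cancer()
x_train, x_test, y_train, y_test = train_test_split(cancer.data, cancer.target, test_size=0.2)

# Candidate kernels and soft-margin strengths to try (illustrative values)
param_grid = {"kernel": ["linear", "rbf"], "C": [0.5, 1, 2, 10]}

# 5-fold cross-validation over the grid, fit on the training split only
search = GridSearchCV(svm.SVC(), param_grid, cv=5)
search.fit(x_train, y_train)

print("Best parameters:", search.best_params_)
print("Test accuracy:", search.score(x_test, y_test))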
45 files renamed without changes.
22 changes: 11 additions & 11 deletions in ...arning/python/transfer-learning/readme.md → ...arning/python/transfer-learning/readme.md
@@ -1,11 +1,11 @@
# Transfer Learning
In transfer learning, the knowledge of an already trained machine learning model is applied to a different but related problem. For example, if you trained a simple classifier to predict whether an image contains a backpack, you could use the knowledge the model gained during its training to recognize other objects, such as sunglasses. With transfer learning, we basically try to exploit what has been learned in one task to improve generalization in another: we transfer the weights that a network has learned on task A to a new task B.

The general idea is to use knowledge that a model has learned from a task with plenty of labeled training data in a new task where little data is available. Instead of starting the learning process from scratch, you start from patterns that were learned by solving a related task. Transfer learning is mostly used in computer vision and in natural language processing tasks such as sentiment analysis, because of the huge amount of computational power these tasks require.


4 files renamed without changes.
100 changes: 50 additions & 50 deletions in ...is_twitter/Deep Learning/sentiment_cnn.py → ...is_twitter/Deep Learning/sentiment_cnn.py
@@ -1,50 +1,50 @@
import numpy as np
import pandas as pd
from keras.layers import Input, Dense, Bidirectional, Embedding, Dropout, Flatten
from keras.layers import concatenate, SpatialDropout1D, GlobalAveragePooling1D, GlobalMaxPooling1D
from keras.layers.convolutional import Conv1D
from keras.layers.convolutional import MaxPooling1D
from keras.models import Model
from sklearn.model_selection import train_test_split
from utils import *


maxlen = 150
max_features = 2500


gop = pd.read_csv('Data/gop.csv')
data = gop[['text', 'sentiment']]

# Balance Negative - Positive tweets: keep only the first 2236 Negative rows;
# the remaining Negative rows become NaN and are removed by dropna below
data[data['sentiment'] == 'Negative'] = data[data['sentiment'] == 'Negative'][:2236]
data = data.dropna()

data['sentiment'].value_counts()  # Negative: 8493; Neutral: 3142; Positive: 2236
X, Y = format_data(data, max_features, maxlen)
X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.25, random_state=42)


# Input shape
inp = Input(shape=(maxlen,))

# Embedding and CNN
x = Embedding(max_features, 150)(inp)
x = SpatialDropout1D(0.25)(x)
x = Conv1D(filters=32, kernel_size=3, padding='same', activation='relu')(x)
x = MaxPooling1D(pool_size=2)(x)
x = Conv1D(filters=16, kernel_size=5, padding='same', activation='relu')(x)
x = MaxPooling1D(pool_size=4)(x)
x = Flatten()(x)

# Output layer
output = Dense(1, activation='sigmoid')(x)

model = Model(inputs=inp, outputs=output)
model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])


model.fit(X_train, Y_train, epochs=5, batch_size=32, verbose=1)

results = model.predict(X_test, batch_size=1, verbose=1)
run_test(results, Y_test)
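A quick way to sanity-check the network above is Keras's built-in summary and evaluation helpers. A small sketch, not part of this commit, assuming the model and test split defined above:

model.summary()  # prints layer output shapes and parameter counts
loss, acc = model.evaluate(X_test, Y_test, batch_size=32, verbose=0)
print('Test accuracy:', acc)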
116 changes: 58 additions & 58 deletions in ..._twitter/Deep Learning/sentiment_utils.py → ..._twitter/Deep Learning/sentiment_utils.py
@@ -1,59 +1,59 @@
import pandas as pd
import numpy as np
from keras.preprocessing.text import Tokenizer
from keras.preprocessing.sequence import pad_sequences


def format_data(data, max_features, maxlen):
    data = data[data.sentiment != "Neutral"]
    data = data.sample(frac=1).reset_index(drop=True)
    data['text'] = data['text'].apply(lambda x: x.lower())

    Y = to_numerical(data['sentiment'].values)  # 0: Negative; 1: Positive
    X = data['text']

    remove_rt_url(X)

    tokenizer = Tokenizer(num_words=max_features)
    tokenizer.fit_on_texts(list(X))

    X = tokenizer.texts_to_sequences(X)
    X = pad_sequences(X, maxlen=maxlen)

    return X, Y


def to_numerical(d):
    """Converts the categorical df[col] to numerical"""
    _, d = np.unique(d, return_inverse=True)
    return d


def run_test(results, Y_validate):
    pos_correct, neg_correct, total_correct = 0, 0, 0
    _, (neg_count, pos_count) = np.unique(Y_validate, return_counts=True)

    for i, r in enumerate(results):
        # Threshold the sigmoid output at 0.5
        if r > 0.5:
            r = 1
        else:
            r = 0

        if r == Y_validate[i]:
            total_correct += 1
            if r == 0:
                neg_correct += 1
            else:
                pos_correct += 1

    print('Positive Accuracy:', pos_correct/pos_count * 100, '%')
    print('Negative Accuracy:', neg_correct/neg_count * 100, '%')
    print('Total Accuracy:', total_correct/(pos_count + neg_count) * 100, '%')


def remove_rt_url(df):
    # Strip leading "RT " retweet markers and URLs from the text, in place
    url = r'((https?):((//)|(\\\\))+([\w\d:#@%/;$()~_?\+-=\\\.&](#!)?)*)'
    df.replace(regex=True, inplace=True, to_replace=r'^RT ', value=r'')
    df.replace(regex=True, inplace=True, to_replace=url, value=r'')
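For reference, a minimal usage sketch of remove_rt_url, not part of this commit; it assumes the function above is in scope, and the sample tweets are invented for illustration:

import pandas as pd

tweets = pd.Series(['RT check this out https://t.co/abc', 'a plain tweet'])
remove_rt_url(tweets)
print(tweets.tolist())  # leading "RT " and the URL are stripped in place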
3 files renamed without changes.