From 4089674470ea195eade950a3c955b3acbe0df4cc Mon Sep 17 00:00:00 2001
From: Jean N'dah Kouagou
Date: Wed, 12 Feb 2020 09:49:46 +0000
Subject: [PATCH] leetcode

---
 .../Jean_Ndah_FML_project-checkpoint.ipynb | 2579 +++++++++++++++++
 ...inary_search_from_scratch-checkpoint.ipynb | 115 +
 LeetcodeExercises.ipynb | 285 ++
 3 files changed, 2979 insertions(+)
 create mode 100644 .ipynb_checkpoints/Jean_Ndah_FML_project-checkpoint.ipynb
 create mode 100644 .ipynb_checkpoints/My_binary_search_from_scratch-checkpoint.ipynb
 create mode 100644 LeetcodeExercises.ipynb

diff --git a/.ipynb_checkpoints/Jean_Ndah_FML_project-checkpoint.ipynb b/.ipynb_checkpoints/Jean_Ndah_FML_project-checkpoint.ipynb
new file mode 100644
index 0000000..ad52056
--- /dev/null
+++ b/.ipynb_checkpoints/Jean_Ndah_FML_project-checkpoint.ipynb
@@ -0,0 +1,2579 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "# $~~~~~~~~~~~~~~~~~~~~\\color{black}{\\text{Jean N'dah Kouagou}}$"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "\n",
+ "### $~~~~~~~~~~~~~~~~~\\color{blue}{\\text{Foundation of Machine Learning}} $\n",
+ "\n",
+ "#### $~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ \\color{green}{\\underline{\\text{Project 1}}}$"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "$\\color{black}{\\text{Introduction}}$\n",
+ "\n",
+ "In this project, we implement three machine learning algorithms: Naive Bayes, Softmax Logistic Regression and Gaussian Discriminant Analysis. All three are classification algorithms, and we test them on the same data set so that their performance can be compared. We summarise the main observations at the bottom of this notebook."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "#!pip3 install progress_bar"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import numpy as np, pandas as pd, seaborn as sns, progress_bar as pb"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from sklearn.preprocessing import LabelEncoder as le\n",
+ "from sklearn.feature_extraction.text import CountVectorizer\n",
+ "from sklearn.model_selection import train_test_split"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Naive Bayes"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class Naive_Bayes(object):\n",
+ "    def __init__(self):\n",
+ "        pass\n",
+ "    \n",
+ "    def Phi_ki(self, i, k):\n",
+ "        \"\"\"Computes the smoothed conditional probability P(X^(i)=1/y=k)\"\"\"\n",
+ "        Res1=np.sum((self.features.iloc[:, i] == 1) & (self.target==k))+1 # adding 1 for\n",
+ "        #Laplace smoothing\n",
+ "        Res2=np.sum(self.target==k)\n",
+ "        Res3=self.target.nunique() # adding the number of classes Res3 to the denominator,\n",
+ "        #again for Laplace smoothing\n",
+ "        return Res1/(Res2+Res3)\n",
+ "    \n",
+ "    def train(self, features, target): \n",
+ "        # Store the training data\n",
+ "        self.features=features\n",
+ "        self.target=target\n",
+ "        # Compute the class priors P(y=k)\n",
+ "        self.p_y_s=np.array([np.sum(self.target==j)/len(self.target) for j in \\\n",
+ "                             np.unique(self.target)])\n",
+ "        # Compute the conditional probabilities P(X^(i)=1/y=k)\n",
+ "        phi_i_k_s=np.array([[self.Phi_ki(i, k) for k in np.unique(self.target)]\\\n",
+ "                            for i in range(self.features.shape[1])])\n",
+ "        self.phi_i_k_s=phi_i_k_s\n",
+ "\n",
+ "    def P_Xi_given_y(self, i, k, X):\n",
+ "        \"\"\"Computes P(X^(i)/y=k). 
Since X^(i)/y=k follows a Bernoulli distribution with parameter\n",
+ "        phi_k^(i), we return the corresponding Bernoulli likelihood:\"\"\"\n",
+ "        return self.phi_i_k_s[i][k]**(X[i])*(1-self.phi_i_k_s[i][k])**\\\n",
+ "               (1-X[i])\n",
+ "    \n",
+ "    \n",
+ "    def P_y_equal_k_given_X(self, k, X):\n",
+ "        \"\"\"Computes P(X/y=k)P(y=k), which is proportional to P(y=k/X); used to predict a class\"\"\"\n",
+ "        Res1=np.prod([self.P_Xi_given_y(i, k, X) for i in range(len(X))])\n",
+ "        Res2=self.p_y_s[k]\n",
+ "        return Res1*Res2\n",
+ "    \n",
+ "    def predict(self, X):\n",
+ "        \"\"\"Predicts, for each row of X, the class k maximising P(y=k/X)\"\"\"\n",
+ "        predictions=[]\n",
+ "        bar = pb.ProgressBar(\"predictions\", offset=2, total_width=100, min_value=0, \\\n",
+ "                             max_value=X.shape[0]-1)\n",
+ "        for j in range(X.shape[0]):\n",
+ "            bar(j)\n",
+ "            List=[]\n",
+ "            for k in np.unique(self.target):\n",
+ "                List.append(self.P_y_equal_k_given_X(k, X.iloc[j, :]))\n",
+ "            predictions.append(np.argmax(List))\n",
+ "        return np.array(predictions)"
+ ]
+ },
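+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "With Laplace smoothing, Phi_ki estimates $P(X^{(i)}=1/y=k)=\\dfrac{\\#\\{X^{(i)}=1,\\ y=k\\}+1}{\\#\\{y=k\\}+K}$, where $K$ is the number of classes. As a quick sanity check of the implementation (on made-up toy data, not the project data set):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Toy sanity check: two binary features, two classes (illustrative data only)\n",
+ "toy_X = pd.DataFrame([[1, 1], [0, 1], [1, 0], [0, 0], [1, 1], [0, 0]])\n",
+ "toy_y = pd.Series([1, 1, 0, 0, 1, 0])\n",
+ "toy_nb = Naive_Bayes()\n",
+ "toy_nb.train(toy_X, toy_y)\n",
+ "toy_nb.predict(toy_X)  # should recover most of toy_y\n",
+ "toy_nb.phi_i_k_s       # smoothed estimates of P(X^(i)=1/y=k)"
+ ]
+ },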
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Gaussian Discriminant Analysis"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class GDAMulticlass(object):\n",
+ "    \n",
+ "    def __init__(self, regularizer=0.1):\n",
+ "        # The regularizer allows us to avoid singular matrices during the computations\n",
+ "        self.regularizer=regularizer\n",
+ "    \n",
+ "    def train(self, features, target):\n",
+ "        self.features=features\n",
+ "        self.target=target\n",
+ "        self.number_features=self.features.shape[1]\n",
+ "        combined=pd.concat([features, target], axis=1)\n",
+ "        # Compute the mean mu_k of each class\n",
+ "        self.mu_s=[combined[combined['target']==j].drop('target', axis=1).mean(axis=0)\\\n",
+ "                   for j in np.unique(self.target)]\n",
+ "        # Compute the prior phi_k of each class\n",
+ "        self.phi_s=(1.0/len(self.target))*np.array([self.target[self.target==j].count() \\\n",
+ "                   for j in np.unique(target)])\n",
+ "        \n",
+ "        # Finally, compute the shared covariance matrix sigma\n",
+ "        sigma=np.matrix(np.zeros([self.number_features, self.number_features]))\n",
+ "        \n",
+ "        bar = pb.ProgressBar(\"training\", offset=2, total_width=100, min_value=0,\\\n",
+ "              max_value=self.target.shape[0]-1) # This tracks the progression of the\n",
+ "        #computation of sigma\n",
+ "        for i in range(self.target.shape[0]):\n",
+ "            bar(i)\n",
+ "            sigma += np.dot(np.matrix(self.features.iloc[i, :]-\\\n",
+ "                     self.mu_s[int(self.target.iloc[i])]).T, \\\n",
+ "                     np.matrix(self.features.iloc[i, :]-self.mu_s[int(self.target.iloc[i])]))\n",
+ "        \n",
+ "        self.sigma=(1.0/self.target.shape[0])*sigma\n",
+ "    \n",
+ "    def P_x_given_y(self, sigma, x, mu):\n",
+ "        # Regularise sigma when it is singular, so that det and inv are well defined\n",
+ "        if np.linalg.det(sigma)==0:\n",
+ "            sigma=sigma+self.regularizer*np.eye(self.number_features)\n",
+ "        # Cap the exponent at 380: (2*pi)**d overflows float64 for large d\n",
+ "        d=min(self.number_features, 380)\n",
+ "        comp1 = 1.0/(np.sqrt((2*np.pi)**d)*np.sqrt(np.linalg.det(sigma)))\n",
+ "        comp2 = float(np.exp(np.dot(-0.5*np.dot(x-mu, np.linalg.inv(sigma)), x-mu)))\n",
+ "        \n",
+ "        return comp1*comp2\n",
+ "    \n",
+ "    def predict(self, X):\n",
+ "        predictions=[]\n",
+ "        bar = pb.ProgressBar(\"predictions\", offset=2, total_width=100, min_value=0, \\\n",
+ "                             max_value=X.shape[0]-1)\n",
+ "        for i in range(X.shape[0]):\n",
+ "            bar(i)\n",
+ "            Prob=[self.P_x_given_y(self.sigma, X.iloc[i, :], self.mu_s[j])*self.phi_s[j]\\\n",
+ "                  for j in np.unique(self.target)]\n",
+ "            \n",
+ "            predictions.append(np.argmax(Prob))\n",
+ "        \n",
+ "        return np.array(predictions)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Multiclass Logistic Regression"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class MulticlassLogReg(object):\n",
+ "    def __init__(self, lr=0.2, Max_iter=30):\n",
+ "        self.lr=lr\n",
+ "        self.Max_iter=Max_iter\n",
+ "    \n",
+ "    #Definition of the softmax function\n",
+ "    def softmax(self, k, X):\n",
+ "        return np.exp(X[k])/np.sum([np.exp(X[j]) for j in range(len(X))])\n",
+ "    \n",
+ "    #Function to compute the probability P(y=k/X_i; weights)\n",
+ "    def prob_yequal_k_given_Xi_weights(self, X_i, k, Weights):\n",
+ "        return self.softmax(k, [np.dot(Weights[l], X_i) for l in range(len(Weights))])\n",
+ "    \n",
+ "    # Function to compute the gradient associated with the class k\n",
+ "    def get_gradient(self, k, Weights, X, y):\n",
+ "        grad_k=-np.array([((y.iloc[i]==k)-self.prob_yequal_k_given_Xi_weights(X.iloc[i, :], k, Weights))\\\n",
+ "               *X.iloc[i, :] for i in range(X.shape[0])]).mean(axis=0)\n",
+ "        return grad_k\n",
+ "    \n",
+ "    def fit(self, features, target, weights):\n",
+ "        self.target=target\n",
+ "        self.weights=weights\n",
+ "        Intercept=np.ones_like(self.target).reshape(-1,1)\n",
+ "        features=pd.DataFrame(np.concatenate([Intercept, features], axis=1))\n",
+ "        \n",
+ "        num_iter=0\n",
+ "        #To track the progress of the training process\n",
+ "        bar=pb.ProgressBar(\"training\", offset=2, total_width=100,\\\n",
+ "            min_value=0, max_value=self.Max_iter-1)\n",
+ "        \n",
+ "        while (num_iter < self.Max_iter):\n",
+ "            bar(num_iter)\n",
+ "            # Gradient-descent step on each class's weight vector\n",
+ "            for k in range(len(self.weights)):\n",
+ "                self.weights[k]=self.weights[k]-self.lr*self.get_gradient(k, self.weights, features, self.target)\n",
+ "            num_iter += 1\n",
+ "    \n",
+ "    def predict(self, X):\n",
+ "        # Prepend the intercept column, then return the class with the largest softmax probability\n",
+ "        X=pd.DataFrame(np.concatenate([np.ones((X.shape[0], 1)), X], axis=1))\n",
+ "        predictions=[]\n",
+ "        bar=pb.ProgressBar(\"predictions\", offset=2, total_width=100,\\\n",
+ "            min_value=0, max_value=X.shape[0]-1)\n",
+ "        for i in range(X.shape[0]):\n",
+ "            bar(i)\n",
+ "            Prob=[self.prob_yequal_k_given_Xi_weights(X.iloc[i, :], k, self.weights)\\\n",
+ "                  for k in range(len(self.weights))]\n",
+ "            predictions.append(np.argmax(Prob))\n",
+ "        return np.array(predictions)"
+ ]
+ },
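+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "The gradient computed by get_gradient is that of the softmax cross-entropy loss: for each class $k$,\n",
+ "$$\\nabla_{w_k} J(W)=-\\frac{1}{N}\\sum_{i=1}^{N}\\left(\\mathbb{1}\\{y_i=k\\}-P(y=k/x_i;W)\\right)x_i,$$\n",
+ "and fit performs the update $w_k \\leftarrow w_k - lr\\cdot\\nabla_{w_k} J(W)$ for Max_iter iterations, with an intercept column prepended to the features."
+ ]
+ },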
+ [Gap: the cells that load the drug-review data into Totaldata are missing from this patch text. The next output is Totaldata.head(3).]
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "[HTML rendering of Totaldata.head(3) omitted; see the text/plain table below.]"
\n", + "" + ], + "text/plain": [ + " Unnamed: 0 urlDrugName rating effectiveness \\\n", + "0 2202 enalapril 4 Highly Effective \n", + "1 3117 ortho-tri-cyclen 1 Highly Effective \n", + "2 1146 ponstel 10 Highly Effective \n", + "\n", + " sideEffects condition \\\n", + "0 Mild Side Effects management of congestive heart failure \n", + "1 Severe Side Effects birth prevention \n", + "2 No Side Effects menstrual cramps \n", + "\n", + " benefitsReview \\\n", + "0 slowed the progression of left ventricular dys... \n", + "1 Although this type of birth control has more c... \n", + "2 I was used to having cramps so badly that they... \n", + "\n", + " sideEffectsReview \\\n", + "0 cough, hypotension , proteinuria, impotence , ... \n", + "1 Heavy Cycle, Cramps, Hot Flashes, Fatigue, Lon... \n", + "2 Heavier bleeding and clotting than normal. \n", + "\n", + " commentsReview \n", + "0 monitor blood pressure , weight and asses for ... \n", + "1 I Hate This Birth Control, I Would Not Suggest... \n", + "2 I took 2 pills at the onset of my menstrual cr... " + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Totaldata.head(3)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAX0AAAEKCAYAAAD+XoUoAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvOIA7rQAAIABJREFUeJzt3Xl8VfWd//HXJzcLWYGEsIWEBAiyKmAElLq0blhbsYu/unXsdHFsdexMnZnqrx07dX7tr8vM/Kad2lZqbae2lFrrtNTBolYd3ECCCLJKCJCELYEkJCFkvZ/fH7na2xjIzXqT3Pfz8eDhPed+vzefI+Gdk+/5nu8xd0dERGJDXLQLEBGRwaPQFxGJIQp9EZEYotAXEYkhCn0RkRii0BcRiSEKfRGRGKLQFxGJIQp9EZEYEh/tAjobN26c5+fnR7sMEZFhZfPmzcfdPbu7dhGFvpktB74DBICH3f0bZ2j3UeDXwAXuXhzadx/wKaAduNvd153ta+Xn51NcXBxJWSIiEmJmByNp123om1kAeBC4EqgANpnZGnff2aldOnA3sDFs3xzgRmAuMBl41sxmunt7pAciIiL9J5Ix/cVAibuXunsLsBpY0UW7fwa+BTSF7VsBrHb3ZnffD5SEPk9ERKIgktDPAcrDtitC+95hZguBXHd/sqd9RURk8EQS+tbFvnfWYzazOOD/Aff0tG/YZ9xuZsVmVlxVVRVBSSIi0huRhH4FkBu2PQU4HLadDswDXjCzA8BSYI2ZFUXQFwB3X+nuRe5elJ3d7cVnERHppUhCfxNQaGYFZpZIx4XZNW+/6e4n3X2cu+e7ez6wAbguNHtnDXCjmSWZWQFQCLzW70chIiIR6Xb2jru3mdldwDo6pmw+4u47zOwBoNjd15yl7w4zewzYCbQBd2rmjohI9NhQe1xiUVGRa56+iEjPmNlmdy/qrp2WYRARiSFDbhkGEZEzWbWxrNd9b16S14+VDF860xcRiSEKfRGRGKLQFxGJIQp9EZEYotAXEYkhCn0RkRii0BcRiSEKfRGRGKLQFxGJIQp9EZEYotAXEYkhCn0RkRii0BcRiSEKfRGRGKLQFxGJIQp9EZEYElHom9lyM9tjZiVmdm8X799hZm+a2Rtm9pKZzQntzzez06H9b5jZD/v7AEREJHLdPjnLzALAg8CVQAWwyczWuPvOsGar3P2HofbXAf8GLA+9t8/dF/Rv2SIi0huRnOkvBkrcvdTdW4DVwIrwBu5eF7aZCgytp62LiAgQWejnAOVh2xWhfX/GzO40s33At4C7w94qMLMtZvY/ZnZxn6oVEZE+iST0rYt97zqTd/cH3X068EXgy6HdR4A8d18IfAFYZWYZ7/oCZrebWbGZFVdVVUVevYiI9EgkoV8B5IZtTwEOn6X9auB6AHdvdvcTodebgX3AzM4d3H2luxe5e1F2dnaktYuISA9FEvqbgEIzKzCzROBGYE14AzMrDNu8Ftgb2p8duhCMmU0DCoHS/ihcRER6rtvZO+7eZmZ3AeuAAPCIu+8wsweAYndfA9xlZlcArUANcFuo+yXAA2bWBrQDd7h79UAciIiIdK/b0Adw97XA2k777g97/fkz9PsN8Ju+FCgiIv1Hd+SKiMQQhb6ISAxR6IuIxBCFvohIDFHoi4jEEIW+iEgMUeiLiMQQhb6ISAxR6IuIxBCFvohIDFHoi4jEEIW+iEgMUeiLiMQQhb6ISAxR6IuIxBCFvohIDFHoi4jEEIW+iEgMiSj0zWy5me0xsxIzu7eL9+8wszfN7A0ze8nM5oS9d1+o3x4zu7o/ixcRkZ7pNvTNLAA8CFwDzAFuCg/1kFXuPt/dFwDfAv4t1HcOcCMwF1gOfD/0eSIiEgWRnOkvBkrcvdTdW4DVwIrwBu5eF7aZCnjo9Qpgtbs3u/t+oCT0eSIiEgXxEbTJAcrDtiuAJZ0bmdmdwBeAROB9YX03dOqb00Xf24HbAfLy8iKpW0T6waqNZb3qd/MS/TsdriI507cu9vm7drg/6O7TgS8CX+5h35XuXuTuRdnZ2RGUJCIivRFJ6FcAuWHbU4DDZ2m/Gri+l31FRGQARRL6m4BC
Mysws0Q6LsyuCW9gZoVhm9cCe0Ov1wA3mlmSmRUAhcBrfS9bRER6o9sxfXdvM7O7gHVAAHjE3XeY2QNAsbuvAe4ysyuAVqAGuC3Ud4eZPQbsBNqAO929fYCORUREuhHJhVzcfS2wttO++8Nef/4sfb8GfK23BYqISP/RHbkiIjFEoS8iEkMU+iIiMUShLyISQxT6IiIxRKEvIhJDFPoiIjFEoS8iEkMU+iIiMUShLyISQxT6IiIxRKEvIhJDFPoiIjFEoS8iEkMU+iIiMUShLyISQxT6IiIxJKLQN7PlZrbHzErM7N4u3v+Cme00s21m9kczmxr2XruZvRH6s6ZzXxERGTzdPi7RzALAg8CVQAWwyczWuPvOsGZbgCJ3bzSzzwLfAj4Weu+0uy/o57pFRKQXIjnTXwyUuHupu7cAq4EV4Q3c/Xl3bwxtbgCm9G+ZIiLSHyIJ/RygPGy7IrTvTD4FPBW2PcrMis1sg5ld34saRUSkn3Q7vANYF/u8y4ZmtwJFwKVhu/Pc/bCZTQOeM7M33X1fp363A7cD5OXlRVS4iIj0XCRn+hVAbtj2FOBw50ZmdgXwJeA6d29+e7+7Hw79txR4AVjYua+7r3T3Incvys7O7tEBiIhI5CI5098EFJpZAXAIuBG4ObyBmS0EHgKWu3tl2P6xQKO7N5vZOGAZHRd5RSRGrdpYFu0SYlq3oe/ubWZ2F7AOCACPuPsOM3sAKHb3NcC3gTTg12YGUObu1wGzgYfMLEjHbxXf6DTrR0REBlEkZ/q4+1pgbad994e9vuIM/V4B5velQBER6T+6I1dEJIYo9EVEYohCX0Qkhij0RURiiEJfRCSGKPRFRGKIQl9EJIYo9EVEYohCX0Qkhij0RURiiEJfRCSGKPRFRGKIQl9EJIYo9EVEYohCX0Qkhij0RURiiEJfRCSGKPRFRGJIRKFvZsvNbI+ZlZjZvV28/wUz22lm28zsj2Y2Ney928xsb+jPbf1ZvIiI9Ey3oW9mAeBB4BpgDnCTmc3p1GwLUOTu5wKPA98K9c0EvgIsARYDXzGzsf1XvoiI9EQkZ/qLgRJ3L3X3FmA1sCK8gbs/7+6Noc0NwJTQ66uBZ9y92t1rgGeA5f1TuoiI9FQkoZ8DlIdtV4T2ncmngKd60tfMbjezYjMrrqqqiqAkERHpjUhC37rY5102NLsVKAK+3ZO+7r7S3YvcvSg7OzuCkkREpDfiI2hTAeSGbU8BDnduZGZXAF8CLnX35rC+l3Xq+0JvChUROZuG5jZ2Halj15E6UpPiWTZ9HBNHj4p2WUNOJKG/CSg0swLgEHAjcHN4AzNbCDwELHf3yrC31gFfD7t4exVwX5+rFhEJaWxp44nXD7HrSB0OjE1JoKG5jc0Ha5gxPo2r5kxgytiUaJc5ZHQb+u7eZmZ30RHgAeARd99hZg8Axe6+ho7hnDTg12YGUObu17l7tZn9Mx0/OAAecPfqATkSEYk5lfVNPPrqQWpPt3LJzGzm54xm0uhRnG5t57X91byy7wQ/efkAd19eGO1Sh4xIzvRx97XA2k777g97fcVZ+j4CPNLbAkVEurL3WD2/3FRGIC6OT7+ngKlZqe+8l5IYz2XnjGdezmi+91wJv95czl9dMo24uK4uM8aWiEJfRIauVRvLol3CoNt9tI6fbzjI+PRRfPzCqYxNSeyy3bi0JD5w7iSe2HKIh18q5fZLpg9ypUOPlmEQkWGltKqBVRvLmDQ6mdsvmXbGwH/b+VPHMndyBt9et4fth04OUpVDl0JfRIaN8upGfrbhIJmpiXzionxGJQS67WNmfGhBDpmpidz7xDbcu5xxHjMU+iIyLByta+KnrxwgLSmeTy4rIDUp8tHplKR4Pn/5TLYfquP1spoBrHLoU+iLyJBXfaqFn7y8n/iA8cllBWQkJ/T4M65fOJn0pHgeffXgAFQ4fCj0RWRIqzvdyo9fKqWt3fnksgIyU88+hn8mKYnxfOT8Kax98yjHG5q77zBCKfRFZMiqb2rlkZf3c6qlnb9cls+EjL7dYXvr0qm0tAd5rLi8+8YjlEJfRIakmsYWVq4vpaaxhY8vndovd9XOGJ/GRdOz+MWGMtqDsXlBV6EvIkNOZX0TK9eXcqqljU8uK2B6dlq/ffbHl07lUO1pXthT2X3jEUihLyJDyt7KelauL6U96Hzm4ml/dqdtf7hizgQmZCTx6IbYvKCrO3JFpFuNzW3Unm6luS1IS1uQreW1zJqUTlJ89/PkI9UWDPLszmOs33uc7PQk/mLpVLLSkvrt89+WEIjjI4um8ND6UmobWxjTzc1dI41CPwr6ctv8zUvy+rESkTNrDzp7j9VTfLCG3UfrCB8C/89XD5AYiGPWpHSWFGSyfN4kFuaO6fXaNmUnTvHkm0eoqDnN4vxM3j9/EonxAzcQcdXciXz/hX28sKeK6xee7ZlQI49CX0Tepby6kV8Vl1N9qqVjbfoZ45iamUJifIDEgHFu7hi2VtSytbyWn75ygB+9uJ8JGUlcPXciV8yewJJpmd3+FuDuHDjRyPN7KimpbCAlMcDNi/OYlzN6wI/v3JzRZKcn8cyuYwp9EYld7s7L+06wbvtR0pPjuXlxHrMnZRDodAb//vmTeP/8SQDUNbXy3K5K1r55hMeKy/nZqwdJS4pn6bRMzpmYzswJ6eSMSaa13Wlua6f4QDX7j59iX1UDdU1tpCbFc828iSwpyBrQs/twcXHGFbPH8/utR2hpCw7a1x0KFPoiAkBre5BfbSpn55E65kzK4COLppCc2P2YfcaoBK5fmMP1C3Noam3n5ZLjPLvrGJsO1PD8nqoup0amJAaYnp3GjPFpnDdlTFRC9/JZE/jla+Vs3H+Ciwtj5zGtCn0RoS0YZNXGMt46Vs+18ydx0fQsQg9E6pFRCQEunz2By2dPAKC5rZ39x09x9GQTifFxJMUHeHFvFePSkojrxef3p2UzxjEqIY4/7qqMqdCPnd9pRKRL7UHnV5vK2XOsnhULclg2Y1yvAr8rSfEBZk3M4LJzxnPR9HGcP3Us49NHRT3wAZITA7xnRjbP7DwWUytvRhT6ZrbczPaYWYmZ3dvF+5eY2etm1mZmH+30XruZvRH6s6a/CheRvgu68/jmcnYcruPa+ZNYXJAZ7ZIG1ZVzxnOo9jS7j9ZHu5RB023om1kAeBC4BpgD3GRmczo1KwM+Aazq4iNOu/uC0J/r+liviPSjP+46xtaKk1w1ZwLLZoyLdjmD7n2zJmAGz+48Fu1SBk0kZ/qLgRJ3L3X3FmA1sCK8gbsfcPdtQHAAahSRAfDmoZM8v6eK8/PGcunM2BnTDpednsR5U8bwzC6FfrgcIHxJuorQvkiNMrNiM9tgZtf3qDoRGRCHa0/z+OZy8jJTWLFgcr+N4Q9Hl88az7aKk1Sfaol2KYMiktDv6ruhJ1c98ty9CLgZ+Hcze9eTic3s9tAPhuKqqqoefLSI9NSp5jZ+vvEgyQkBblmSR3wgtudzXDQjC4CNpSeiXMngiORvuwLIDdueAhyO9Au4++HQf0uBF4CFXbRZ6e5F7l6
UnR2bv2aKDIagO48Vl1Pf1MatS6eSPqrnT6Aaac6dMoaUxACv7FPov20TUGhmBWaWCNwIRDQLx8zGmllS6PU4YBmws7fFikjfPL+7kr2VDXzw3Mn9sj79SJAQiOOC/Exe1Zl+B3dvA+4C1gG7gMfcfYeZPWBm1wGY2QVmVgHcADxkZjtC3WcDxWa2FXge+Ia7K/RFouCtY/U8t7uShbljuCB/bLTLGVIump5FSWUDlXVN0S5lwEV0R667rwXWdtp3f9jrTXQM+3Tu9wowv481ikgf1Ta28FhxOeMzklixICemL9x25aLpHdNVXy09wYoFI3sBtti+giMSA9qCQX75WsfjAW9ePDWmFheL1JzJGWSMiufVGBjX19++yAj31JtHKa85zYcXTSE7vf8fSjISBOKMJdOyYuJirkJfZATbWlHLq6UnWDY9i/mDsE79cHbhtCzKqhupqGmMdikDSqEvMkJV1jXxX68fYmpmCsvnTYp2OUPe2/P1R/oQj0JfZARqam3n5xvLSIiP48bFee96CIq828zx6WSlJir0RWR4cXd+83oF1aeauWlxLqOTdQNWJOLijKWhcf2RvNSyQl9khHlx73F2HK5j+dyJTBuXFu1yhpWl07M4WtdEWfXIHddX6IuMICWVDazbcZT5OaNjcqnkvloSep7Axv3VUa5k4Cj0RUaImsYWVm8qIzs9iQ8v0g1YvTEjO40xKQlsUuiLyFDW2t7xjNv2oHPLkqkkxXf/QHN5t7g444L8TF47oNAXkSHK3VnzxmEO1Z7mhvNzdQNWHy0pyOTgiUaOjdB1eBT6IsPcpgM1bC6r4b3nZDNncka0yxn2LsjvGNd/bYQO8Sj0RYaxbRW1/H7bYQrHp3H57AnRLmdEmDs5g5TEAJtG6BCPQl9kmKptbOGzP3+dtKR4/ldRLnG6cNsv4gNxnD91rM70RWToCAadv/nVG1TWN3Hz4jxSkyJaJV0itDg/kz3H6qltHHnPzVXoiwxD33+hhBf2VHH/B+aQm6knYPW3xQWZuEPxgZpol9LvFPoiw8zG0hP82zNvcd15k7l16dRolzMinZc7hsRA3IicuqnQFxlGTjQ0c/fqLUzNSuXrH56vG7AGyKiEAOfljh6R4/oRhb6ZLTezPWZWYmb3dvH+JWb2upm1mdlHO713m5ntDf25rb8KF4k1waDzt49tpaaxle/dvJA0jeMPqAvyM9l+6CSNLW3RLqVfdRv6ZhYAHgSuAeYAN5nZnE7NyoBPAKs69c0EvgIsARYDXzEzPZFZpBceWl/K+rc6xvHnTtYDUQba4oJM2oLO5oMja1w/kjP9xUCJu5e6ewuwGlgR3sDdD7j7NiDYqe/VwDPuXu3uNcAzwPJ+qFskprxeVsO/PL2Ha+dP4pYledEuJyYU5WcSiDM2lo6sIZ5IQj8HKA/brgjti0Rf+ooIUNfUyt2/3MLEjFEaxx9EaUnxzMsZzcb9I+uhKpGEflffYZE+YSCivmZ2u5kVm1lxVVVVhB8tMvK5O//7iTc5crKJ7960UA9EGWRLCzLZWn6Sptb2aJfSbyIJ/QogN2x7CnA4ws+PqK+7r3T3Incvys7OjvCjRUa+x4rLeXLbEb5w5UzOn6rLYYNtybRMWtqDvF42csb1Iwn9TUChmRWYWSJwI7Amws9fB1xlZmNDF3CvCu0TkW7sPVbPV9bs4KLpWdxx6fRolxOTivIziTNG1Lh+t6Hv7m3AXXSE9S7gMXffYWYPmNl1AGZ2gZlVADcAD5nZjlDfauCf6fjBsQl4ILRPRM6iqbWdu1ZtITUxnn//2AI92DxKMkYlMGdyBhtKR864fkQTfd19LbC20777w15vomPopqu+jwCP9KFGkR5btbGsV/1uHiIzY776+53sOVbPf35yMeMzRkW7nJi2pCCLRzccpKm1nVEJw//hNLojV2SIeXLbYX75Whl3XDqdS2fqGle0LSnIpKUtyNby2miX0i8U+iJDSEllPV98fBuL8sZwz1Uzo12O0HGTltnIeVi67uMW6Se9HVKCjmGlhuY2/urRzSQnBnjwlkUkBHRONhSMSUlk1sSM0Hz9wmiX02f6rhIZAtydv//1Vg6caOQ/blrEpNHJ0S5JwiwpyGTzwRpa2jovOjD8KPRFhoCH1pfy1Paj3Lt8FhdOz4p2OdLJ0mlZNLUGeWMEjOsr9KPgVHMb2w+d5OCJU7S2D/8zB+mb7YdO8s0/7Obacyfx6YsLol2OdOHC6VnEGby0d/ivGKAx/UHS3NbOj1/az9M7jrG1vPadtSgCZkwaM4rF+ZmcP3XskFxXpa9j1XJmB0+c4rHichbmjuFfbzhvSP79C4xOTuC83DGs33ucL1x1TrTL6ROF/iA4VtfEHT/fzJayWhbmjeF9s8czIzuNU83tlNc0sreynie2HGJLeS0fWpjDuLSkaJcsg6CqvpmfvXqQ0ckJPHzbBSNiDvhIdnFhNt97bi+1jS2MSUmMdjm9puGdAbalrIYP/sdL7Dlazw9uWcR/fW4Zl8+awNSsVOZMzuDquRP53GUz+NDCHI6cPM13/7h3RN39J12rPtXCT17ZT5zBJy7KJzN1+IZIrLikcBxBh1f2De9/nwr9AbTpQDUfe2gDoxICPPG5i7hm/qQu28WZcUF+Jn9zxUymZ6exZuthnt11DPdIFzOV4eR4fTM/erGU5tYgn7iogCz9ZjcsnJc7hvSkeF4c5uP6Cv0BcvRkE5/9+evkjE3md3cuY9bEjG77ZIxK4NalUzk/byzP7a5kzdbDBBX8I8qxuiZ+9GIpbe1BPn1xATljNTVzuEgIxHHh9CzWv3V8WJ+QKfQHQHNbO5/9xWZOt7Sx8uPnM7YHv7oH4owPL8rh4sJxbNxfzeObKxT8I0RJZQM/erEUDD598TTNxR+GLp6ZzaHa0xw40RjtUnpNF3IHwFd/v5MtZbX84JZFFE5I73F/M+OaeZNITgjw9M5jxMcZ1y/MIU4zO4Yld2f9W1U8vfMY2elJfHzpVA3pDFOXFI4D4MW9VRSMS41yNb2j0O9n/73tCKs2lvHZy6afcQw/UpedM57W9iDP76kiIRDHB87t2+fJ4KtvauW3bxxm15E6zp0ymg8vnEJivH7BHq6mZqWSl5nC+reO8xcX5ke7nF5R6Pejk42tfGXNDubnjOaeK/tnsawrZk+gpS3Iy/tOkBCI4+YleZrLPQwE3dlYeoKndx6jLehcO38SF03P0t/dCHBx4Th+u+UQre3BYbk+kkK/H33jD7upaWzhp395AfH99M1gZrx//iRag876vVX8+7N7+dt++oEy1PXlprBoCbqz83Adz++p5MjJJgrHp/HB8ybr3osR5OLCbH6xsYziAzXDcskMhX4/2XSgml++VsZnLi5gXs7ofv1sM+O68ybT3u585497SYyP4873zujXryF9c7yhmVf2HeeVfSeoPtVCZmoiN16Qy/yc0Tq7H2HeUziOxPg41u04qtCPVc1t7dz3xJvkjEkesLPwODM+tCiHvKwUvr1uD4E403NTo6iptZ2dR+p4/WANT+84RvHBaoIOuW
OTWT43jzmTM3ThfYRKS4rn0pnZrNtxlPs/MIe4YfYoy4hC38yWA98BAsDD7v6NTu8nAT8DzgdOAB9z9wNmlk/Hc3X3hJpucPc7+qf0oePHL+2npLKBn3ziAlISB+7naJwZ3/7oubS2B/nGU7upbWzli8vP0ZlkP2kPOscbmqlvaqO+qZX6pjbqTrdS19RKTWMrR2pPc/hkE+XVjeytbKA92DGVdtbEdO56XyHBoDN5jKZhxoJr5k3kmZ3H2FpRy8K8sdEup0e6TSgzCwAPAlcCFcAmM1vj7jvDmn0KqHH3GWZ2I/BN4GOh9/a5+4J+rnvIqKxr4sHnSrhi9gTeO2v8gH+9x4orWDoti8q6Zn74P/t4bX81H1qY0+2Ds7XwWQd3p6q+mcMnm6isb6Kyrpmaxhbqm9o41dzGP/5u+xn7pifFM2nMKHLGJHPF7AnMyxnNebmj35lvPxyvQUjvXD57AgkB4w/bj4680AcWAyXuXgpgZquBFUB46K8A/in0+nHgexYjp5/fWreHlvYgX7529qB9zTgzViyYTNqoeJ7bXUlDcys3nJ9LapJG67pyoqGZ3UfrKT1+ioMnTtHY0g5AnEFWahKZqYlMGZtMWlICl52TTfqoeNJHJZCWFM/o5AQykuMZk5JImv7/Ssjo5AQumj6OtduPcO81s4bVb9uRfBfnAOVh2xXAkjO1cfc2MzsJvH2Fo8DMtgB1wJfd/cXOX8DMbgduB8jLGz5npNsqanl8cwV/dck08gf5Rg0z44rZE8gYlcDvtx7mP57byw1FuUzPThvUOoaioDsVNafZcfgku4/UU9XQDEBmasdj7/KzUpiSmcK4tETi4/58lpV+I5JIXTNvIvc+8SY7Dtf1++SNgRRJ6Hf1I6zzugBnanMEyHP3E2Z2PvBbM5vr7nV/1tB9JbASoKioaFisOeDufPX3OxmXlshd74veTJrFBZlMGZvM6k1lPPLSfi4uzOayc7JjbpnetmCQ/cdPsetIHTsP11HX1EbAjILsVJZMy2TWxAytZCn96qq5E/nSb7fzh+1HR1zoVwC5YdtTgMNnaFNhZvHAaKDaO1YlagZw981mtg+YCRT3tfBoW7P1MJsP1vDNj8wnfVRCVGuZPCaZO987gye3HWH93iqKD1Zz6cxslk7L6tebR1ragtQ3tdLcFqQ96LQHnUCckRQfR1JCgNTEQL/dnxCJ2sYWSiobKKlq4K1j9TS1BkkIGIXj05mXk8E5EzJIToytH34yeDJTE1lSkMlT24/wd1cPnwerRBL6m4BCMysADgE3Ajd3arMGuA14Ffgo8Jy7u5ll0xH+7WY2jY5HyZf2W/VR0tjSxv9du5u5kzP46Pm53XcYBEnxAT6yaApLCjJ5Zucxntp+lPVvVTFn8mjmTs6gpS0Y0e3/J0+3sq+qgX2VDZQeP0VpVQNbymqpa2qlqbX7RzumJsUzJjmBMSkJZKUmEWeQl5VC7tgUJo0e1esfCqdb2qlqaOZQTSMVNacpr2nkeEML0DGFbu7k0cyZlMH07DQtcyCD5pp5E/nH3+3grWP1zOzFOlvR0G3oh8bo7wLW0TFl8xF332FmDwDF7r4G+DHwqJmVANV0/GAAuAR4wMzagHbgDnevHogDGUw/eGEfR+ua+I+bF3Y7a2awTRmbwl8uK6D0eAMbSqvZWl7LpgPV/GpTOVOzUsjLTCFnbDJxZgTdaW0PUlnXzNG6Jg7Xnn4nSAESAkZeZgpZqYlMz04jI3SBMykhjvg4Iy7OCAadprYgTa3tnGpu4+TpVmobWzlW18zuI/WsD1t7PD7OmDh6FOPTk8hOTyIrLYmUhAApiQGSEgK0tTvtwSDN7UFqTrXwZsVJGprbOHGq5Z2Lr9AR8lPGJrM4P5MZ49OZkJE0rC6ko/5yAAALfUlEQVSkychx9byJfPX3O3l8cwX/+/2DN5mjLyKajuDua4G1nfbdH/a6Cbihi36/AX7TxxqHlPLqRh5aX8p1503mgvzMaJdzRtPGpTFtXBqt7UH2VTYQH4ijrPoU+4+feufJP2YdQZydnsSk0cnMmZRBwbhUpmenMX18Grljk4kPxPV6KmLQnUtnZlNW3Uh5dSNl1Y0cqj3N8YZm9h8/xeaDNTS2tHO6tZ3w1aMT4+MYm5KAYe+cxY9LSyQrNYnJY0YxOjlBIS9Dwvj0UVw1dwKPFZfzhStnDotraZqD1kNfX7uLgBn3vX9WtEuJSEIgjlmTMqIyKyXOjNzMFHIzU87azt1paQ8SHxdHnPFOoGveuwwHty6dyto3j/LktiN89Pwp0S6nWxr87IFXSo7z1PajfO6y6XoARj8yM5LiAwTiTGfwMuxcOC2L6dmp/HzDwWiXEhGFfoSaWtv58m+3k5eZwmcumRbtckRkiDAzbl06lTfKa3mz4mS0y+mWQj9C33uuhNLjp/jah+YNi3E7ERk8H140heSEwLA421foR2D30Tp++D/7Qs+uzY52OSIyxIxOTuD6hZP53dZDnGxsjXY5Z6XQ70Z70Pnib95kdHIC/3jtnGiXIyJD1C1LptLUGuTRDQeiXcpZKfS78ZOX97O1vJb7PziHsbqNX0TOYF7OaK6cM4EfvLCPqvrmaJdzRgr9s3ijvJZv/mE3V8yewHXnTY52OSIyxN13zSya24L8v2ffinYpZ6TQP4Paxhbu/MXrjE8fxb/ccK6mEopIt6Zlp3Hr0qmsfq2MPUfro11OlxT6XXB3/u7XW6msb+LBWxYxJkXDOiISmc9fXkhaUjxfX7sr2qV0SaHfhe+/sI9nd1Vy3zWzWZA7JtrliMgwMjY1kb9+XyH/81YVz+0+Fu1y3kWh38mjGw7y7XV7+OB5k/nLZfnRLkdEhqG/uGgqMyekcc9jWymvbox2OX9GoR/m8c0V/ONvt3P5rPH86w3naRxfRHolKT7Ayo8X0R50bn90M40tbdEu6R0K/ZDfvXGIf3h8K++ZMY4Hb1mkNdlFpE/yx6Xy3ZsWsudoHf/w+Dbch8ZDAWM+2Vrbg/yfJ3fy+dVvUJSfycq/OF/LLIhIv7jsnPH8w/JZPLntCF/77120B6Mf/DG9tPKxuibuWvU6mw7UcNuFU/nStXN0hi8i/eqvLpnG4drTPPzSfvZVNfCdmxaSEcVHrMZk6De2tPHjF/fz0PpS2oPOd25cwIoFOdEuS0RGIDPjgRXzmDkhnX9as4Prv/cyD96yiNmTMqJST0SntWa23Mz2mFmJmd3bxftJZvar0PsbzSw/7L37Qvv3mNnV/Vd6z1XVN/Pwi6Vc8q0X+Ndn3uKi6Vn8993vUeCLyIC7delUVn1mKSdPt/L+777IXate561jg38DV7dn+mYWAB4ErgQqgE1mtsbdd4Y1+xRQ4+4zzOxG4JvAx8xsDh3Py50LTAaeNbOZ7t7OIGgPOiWVDWw+WMNT24/wcslxgg6LCzJ56OOLOH/q0H3coYiMPIsLMnn2C5fy8Eul/PTlA/z3m0e4uDCby2eN532zxnf7lLn+EMnwzmKgxN1LAcxsNbACCA/9FcA/hV4/DnzPOuY7rgBWu3szsD/04PTFw
Kv9U/6fnGpu4w/bj1JRc5qKmkYOVjey83AdDc0dU6VyM5P53GUzuG7B5GHz1HoRGXnGpiby91fP4tPvmcYjL+/n91sP85U1O/jKmh1cND2LVZ9ZOqBfP5LQzwHKw7YrgCVnauPubWZ2EsgK7d/Qqe+AjKW0tAW559dbAZiQkcSUsSlcv3AyC3PHsiBvDNPGpWrevYgMGWNTE7nnqnO456pz2H/8FM/trhyUaZ2RhH5XSdm5sjO1iaQvZnY7cHtos8HM9kRQ1xkdBF7rffdxwPG+fP0h4s+O45YoFdHHrzvofxcD8P8pomOI1t9PhN51DEO83i7dMkz+bX/m7G+f7RimRvL5kYR+BZAbtj0FOHyGNhVmFg+MBqoj7Iu7rwRWRlLwQDOzYncvinYdfTUSjkPHMDSMhGOAkXEc/XEMkcze2QQUmlmBmSXScWF2Tac2a4DbQq8/CjznHb+nrAFuDM3uKQAK6dNJuIiI9EW3Z/qhMfq7gHVAAHjE3XeY2QNAsbuvAX4MPBq6UFtNxw8GQu0eo+Oibxtw52DN3BERkXeL6OYsd18LrO207/6w103ADWfo+zXga32ocbANiWGmfjASjkPHMDSMhGOAkXEcfT4GGyqLAImIyMDTQjMiIjFEoR+mu+UmhjozyzWz581sl5ntMLPPR7um3jKzgJltMbMno11Lb5nZGDN73Mx2h/5OLox2TT1lZn8b+l7abma/NLNR0a4pEmb2iJlVmtn2sH2ZZvaMme0N/XdsNGvszhmO4duh76dtZvZfZtbjR/sp9EPClpu4BpgD3BRaRmI4aQPucffZwFLgzmF4DG/7PDA0HzIaue8Af3D3WcB5DLPjMbMc4G6gyN3n0TGR48boVhWxnwLLO+27F/ijuxcCfwxtD2U/5d3H8Awwz93PBd4C7uvphyr0/+Sd5SbcvQV4e7mJYcPdj7j766HX9XSEzLBbTc7MpgDXAg9Hu5beMrMM4BI6Zrbh7i3uXhvdqnolHkgO3X+TQhf32QxF7r6ejpmE4VYA/xl6/Z/A9YNaVA91dQzu/rS7v/0Yrg103PvUIwr9P+lquYlhF5hvC610uhDYGN1KeuXfgX8AgtEupA+mAVXAT0LDVA+bWWq0i+oJdz8E/AtQBhwBTrr709Gtqk8muPsR6DhBAsZHuZ6++iTwVE87KfT/JKIlI4YDM0sDfgP8jbvXRbuenjCzDwCV7r452rX0UTywCPiBuy8ETjH0hxP+TGjMewVQQMcqualmdmt0qxIAM/sSHcO5v+hpX4X+n0S0ZMRQZ2YJdAT+L9z9iWjX0wvLgOvM7AAdQ2zvM7OfR7ekXqkAKtz97d+0Hqfjh8BwcgWw392r3L0VeAK4KMo19cUxM5sEEPpvZZTr6RUzuw34AHCL92LOvUL/TyJZbmJICy1n/WNgl7v/W7Tr6Q13v8/dp7h7Ph1/B8+5+7A7u3T3o0C5mZ0T2nU5f74c+XBQBiw1s5TQ99blDLOL0Z2ELxdzG/C7KNbSK2a2HPgicJ27N/bmMxT6IaGLI28vN7ELeMzdd0S3qh5bBnycjrPjN0J/3h/tomLYXwO/MLNtwALg61Gup0dCv6U8DrwOvElHXgyLu1rN7Jd0PLfjHDOrMLNPAd8ArjSzvXQ8FOob0ayxO2c4hu8B6cAzoX/fP+zx5+qOXBGR2KEzfRGRGKLQFxGJIQp9EZEYotAXEYkhCn0RkRii0Bc5CzP7GzNLCdte25uVDUWGCk3ZlJgXuvHI3P1da/2E7gwucvfjg16YyADQmb7EJDPLD61x/306bj76sZkVh9aO/2qozd10rDnzvJk9H9p3wMzGhfX/UajP02aWHGpzQWi981dD659vP1MdIoNNoS+x7BzgZ6EF0e5x9yLgXOBSMzvX3b9Lx/pL73X393bRvxB40N3nArXAR0L7fwLc4e4XAu0DfhQiPaDQl1h20N03hF7/LzN7HdgCzKXjQTrd2e/ub4RebwbyQ+P96e7+Smj/qn6tWKSP4qNdgEgUnQIwswLg74AL3L3GzH4KRPJYwOaw1+1AMl0v0S0yZOhMXwQy6PgBcNLMJtDxyMy31dOxwFVE3L0GqDezpaFdw+XxghIjdKYvMc/dt5rZFmAHUAq8HPb2SuApMztyhnH9rnwK+JGZnQJeAE72Z70ifaEpmyL9zMzS3L0h9PpeYJK7fz7KZYkAOtMXGQjXmtl9dPz7Ogh8IrrliPyJzvRFRGKILuSKiMQQhb6ISAxR6IuIxBCFvohIDFHoi4jEEIW+iEgM+f/UlWRG6yuFSgAAAABJRU5ErkJggg==\n", + "text/plain": [ + "
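+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "As a quick numerical complement to the histogram above, we can also print summary statistics of the raw ratings:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Numerical summary of the raw 1-10 ratings plotted above\n",
+ "Totaldata['rating'].describe()"
+ ]
+ },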
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "sns.distplot(Totaldata['rating'], bins=15)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## We choose 'efficiency' to be our target and we divide the 'rating' column into two classes: $0$ if the rating is below $7$ and $1$ otherwise, which we use as one of our features." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "Totaldata['rating'] = (Totaldata['rating'] >6).astype(int)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### $\\color{blue}{\\text{10% of the data}}$" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "def get_data(data, percentage):\n", + " Random=list(range(data.shape[0]))\n", + " np.random.shuffle(Random)\n", + " data=data.iloc[Random]\n", + " return data.iloc[[i for i in range(int(percentage*len(data)))]]" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "ten_percent_data=get_data(Totaldata, 0.1)\n", + "\n", + "ten_percent_data=ten_percent_data[['sideEffects', 'sideEffectsReview',\\\n", + " 'commentsReview', 'rating', 'effectiveness']]\n", + "rating=ten_percent_data['rating']\n", + "ten_percent_data=ten_percent_data.drop('rating', axis=1)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [], + "source": [ + "Features=ten_percent_data.drop(['effectiveness'], axis=1)\n", + "Target=ten_percent_data['effectiveness']\n", + "Target=le().fit_transform(Target)\n", + "\n", + "Dat=''\n", + "for col in Features.columns: \n", + " Dat += Features[col].map(str) + ' '" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1004 Mild Side Effects I experienced drowsiness in ...\n", + "163 Moderate Side Effects Joint pain, reduction of...\n", + "2128 Extremely Severe Side Effects These were sever...\n", + "1047 No Side Effects None experienced Applied every...\n", + "1838 Mild Side Effects Appetite seems to fluctuate,...\n", + "Name: sideEffects, dtype: object" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Dat.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "Text_tranform=CountVectorizer(analyzer='word', max_features=100, stop_words='english', binary=True).fit(Dat)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [], + "source": [ + "Text_tranform.vocabulary_;" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [], + "source": [ + "Numerical_features=Text_tranform.transform(Dat)\n", + "Numerical_features=Numerical_features.toarray()\n", + "Data=pd.DataFrame(Numerical_features) \n", + "\n", + "Data=pd.DataFrame(np.concatenate([rating.values.reshape(-1,1), Data], axis=1))\n", + "Data=pd.DataFrame(np.concatenate([Data, Target.reshape(-1,1)], axis=1))" + ] + }, + { + 
"cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
0123456789...9293949596979899100101
00100100000...0110100003
10000000000...0000000114
20000000010...0000000000
30000000000...0000000004
41000000000...0001001001
\n", + "

5 rows × 102 columns

\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 ... 92 93 94 95 \\\n", + "0 0 1 0 0 1 0 0 0 0 0 ... 0 1 1 0 \n", + "1 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 \n", + "2 0 0 0 0 0 0 0 0 1 0 ... 0 0 0 0 \n", + "3 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 \n", + "4 1 0 0 0 0 0 0 0 0 0 ... 0 0 0 1 \n", + "\n", + " 96 97 98 99 100 101 \n", + "0 1 0 0 0 0 3 \n", + "1 0 0 0 1 1 4 \n", + "2 0 0 0 0 0 0 \n", + "3 0 0 0 0 0 4 \n", + "4 0 0 1 0 0 1 \n", + "\n", + "[5 rows x 102 columns]" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Data.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [], + "source": [ + "Train_features, Test_features, Train_target, Test_target = train_test_split(Data.iloc[:, :-1],\\\n", + " Data.iloc[:, -1], test_size=0.4, random_state=0)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [], + "source": [ + "weights=np.ones((len(np.unique(Train_target)), 1+Train_features.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=100, lr=0.3)" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "MultiLogReg.fit(Train_features, pd.Series(Train_target), weights)" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "Predict=MultiLogReg.predict(Test_features)" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{0, 1, 2, 3, 4}" + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "set(Predict)" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of Multiclass Logistic Regression: 46.98795180722892%\n" + ] + } + ], + "source": [ + "accuracy=(Test_target==Predict).sum()/len(Test_target)\n", + "print(\"Accuracy of Multiclass Logistic Regression: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [], + "source": [ + "NB=Naive_Bayes()\n", + "\n", + "NB.train(Train_features, pd.Series(Train_target))" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "Pred=NB.predict(Test_features)" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of my Bernoulli Naive Bayes: 
43.373493975903614%\n" + ] + } + ], + "source": [ + "accuracy=(Test_target==Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of my Bernoulli Naive Bayes: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "GDA_Model=GDAMulticlass(regularizer=0.1)\n", + "GDA_Model.train(pd.DataFrame(Train_features), pd.Series(Train_target, name='target'))" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "GDA_Pred=GDA_Model.predict(pd.DataFrame(Test_features))" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of GDA: 45.78313253012048%\n" + ] + } + ], + "source": [ + "accuracy=(Test_target==GDA_Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of GDA: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### $\\color{blue}{\\text{30% of the data}}$" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [], + "source": [ + "thirty_percent_data=get_data(Totaldata, 0.3)\n", + "\n", + "thirty_percent_data=thirty_percent_data[['sideEffects', 'sideEffectsReview', \\\n", + " 'commentsReview', 'rating', 'effectiveness']]\n", + "rating=thirty_percent_data['rating']\n", + "thirty_percent_data=thirty_percent_data.drop('rating', axis=1)\n", + "\n", + "Features=thirty_percent_data.drop(['effectiveness'], axis=1)\n", + "Target=thirty_percent_data['effectiveness']\n", + "Target=le().fit_transform(Target)\n", + "\n", + "Dat=''\n", + "for col in Features.columns: \n", + " Dat += Features[col].map(str) + ' '" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
0123456789...9293949596979899100101
01000000000...0000000004
10000000001...0000000003
21000000101...0010101101
31010000000...0011000001
41000000000...0000000001
\n", + "

5 rows × 102 columns

\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 ... 92 93 94 95 \\\n", + "0 1 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 \n", + "1 0 0 0 0 0 0 0 0 0 1 ... 0 0 0 0 \n", + "2 1 0 0 0 0 0 0 1 0 1 ... 0 0 1 0 \n", + "3 1 0 1 0 0 0 0 0 0 0 ... 0 0 1 1 \n", + "4 1 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 \n", + "\n", + " 96 97 98 99 100 101 \n", + "0 0 0 0 0 0 4 \n", + "1 0 0 0 0 0 3 \n", + "2 1 0 1 1 0 1 \n", + "3 0 0 0 0 0 1 \n", + "4 0 0 0 0 0 1 \n", + "\n", + "[5 rows x 102 columns]" + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Text_tranform=CountVectorizer(analyzer='word', max_features=100, stop_words='english', binary=True).fit(Dat)\n", + "\n", + "Text_tranform.vocabulary_;\n", + "\n", + "Numerical_features=Text_tranform.transform(Dat)\n", + "Numerical_features=Numerical_features.toarray()\n", + "Data=pd.DataFrame(Numerical_features) \n", + "\n", + "Data=pd.DataFrame(np.concatenate([rating.values.reshape(-1,1), Data], axis=1))\n", + "Data=pd.DataFrame(np.concatenate([Data, Target.reshape(-1,1)], axis=1))\n", + "\n", + "Data.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [], + "source": [ + "Train_features, Test_features, Train_target, Test_target = train_test_split(Data.iloc[:, :-1],\\\n", + " Data.iloc[:, -1], test_size=0.4, random_state=0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "weights=np.ones((len(np.unique(Train_target)), 1+Train_features.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=100, lr=0.3)\n", + "\n", + "MultiLogReg.fit(Train_features, pd.Series(Train_target), weights)" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of Multiclass Logistic Regression: 44.46680080482898%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "Predict=MultiLogReg.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Predict).sum()/len(Test_target)\n", + "print(\"Accuracy of Multiclass Logistic Regression: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "metadata": {}, + "outputs": [], + "source": [ + "NB=Naive_Bayes()\n", + "\n", + "NB.train(Train_features, pd.Series(Train_target))" + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of my Bernoulli Naive Bayes: 43.05835010060362%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + 
"Pred=NB.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of my Bernoulli Naive Bayes: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "GDA_Model=GDAMulticlass(regularizer=0.01)\n", + "GDA_Model.train(pd.DataFrame(Train_features), pd.Series(Train_target, name='target'))" + ] + }, + { + "cell_type": "code", + "execution_count": 40, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of GDA: 44.668008048289735%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "GDA_Pred=GDA_Model.predict(pd.DataFrame(Test_features))\n", + "\n", + "accuracy=(Test_target==GDA_Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of GDA: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### $\\color{blue}{\\text{60% of the data}}$" + ] + }, + { + "cell_type": "code", + "execution_count": 41, + "metadata": {}, + "outputs": [], + "source": [ + "sixty_percent_data=get_data(Totaldata, 0.6)\n", + "\n", + "sixty_percent_data=sixty_percent_data[['sideEffects', 'sideEffectsReview', 'commentsReview', 'rating', 'effectiveness']]\n", + "rating=sixty_percent_data['rating']\n", + "sixty_percent_data=sixty_percent_data.drop('rating', axis=1)\n", + "\n", + "\n", + "\n", + "Features=sixty_percent_data.drop(['effectiveness'], axis=1)\n", + "Target=sixty_percent_data['effectiveness']\n", + "Target=le().fit_transform(Target)\n", + "\n", + "Dat=''\n", + "for col in Features.columns: \n", + " Dat += Features[col].map(str) + ' '" + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "metadata": {}, + "outputs": [], + "source": [ + "Text_tranform=CountVectorizer(analyzer='word', max_features=100, stop_words='english', binary=True).fit(Dat)\n", + "\n", + "Text_tranform.vocabulary_;\n", + "\n", + "Numerical_features=Text_tranform.transform(Dat)\n", + "Numerical_features=Numerical_features.toarray()\n", + "Data=pd.DataFrame(Numerical_features) \n", + "\n", + "Data=pd.DataFrame(np.concatenate([rating.values.reshape(-1,1), Data], axis=1))\n", + "Data=pd.DataFrame(np.concatenate([Data, Target.reshape(-1,1)], axis=1))\n", + "\n", + "Data.head();" + ] + }, + { + "cell_type": "code", + "execution_count": 43, + "metadata": {}, + "outputs": [], + "source": [ + "Train_features, Test_features, Train_target, Test_target = train_test_split(Data.iloc[:, :-1],\\\n", + " Data.iloc[:, -1], test_size=0.4, random_state=0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: 
[=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "weights=np.ones((len(np.unique(Train_target)), 1+Train_features.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=100, lr=0.3)\n", + "\n", + "MultiLogReg.fit(Train_features, pd.Series(Train_target), weights)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of Multiclass Logistic Regression: 46.17706237424547%\n" + ] + } + ], + "source": [ + "Predict=MultiLogReg.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Predict).sum()/len(Test_target)\n", + "print(\"Accuracy of Multiclass Logistic Regression: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + "execution_count": 46, + "metadata": {}, + "outputs": [], + "source": [ + "NB=Naive_Bayes()\n", + "\n", + "NB.train(Train_features, pd.Series(Train_target))" + ] + }, + { + "cell_type": "code", + "execution_count": 47, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of my Bernoulli Naive Bayes: 45.87525150905433%\n" + ] + } + ], + "source": [ + "Pred=NB.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of my Bernoulli Naive Bayes: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "GDA_Model=GDAMulticlass(regularizer=0.1)\n", + "GDA_Model.train(pd.DataFrame(Train_features), pd.Series(Train_target, name='target'))" + ] + }, + { + "cell_type": "code", + "execution_count": 49, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of GDA: 48.08853118712273%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "GDA_Pred=GDA_Model.predict(pd.DataFrame(Test_features))\n", + "\n", + "accuracy=(Test_target==GDA_Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of GDA: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### $\\color{blue}{\\text{100% of the data}}$" + ] + }, + { + "cell_type": "code", + "execution_count": 50, + "metadata": {}, + "outputs": [], + "source": [ + "whole_data=get_data(Totaldata, 1.0)\n", + "\n", + 
"whole_data=whole_data[['sideEffects', 'sideEffectsReview', 'commentsReview', 'rating', 'effectiveness']]\n", + "rating=whole_data['rating']\n", + "whole_data=whole_data.drop('rating', axis=1)\n", + "\n", + "\n", + "\n", + "Features=whole_data.drop(['effectiveness'], axis=1)\n", + "Target=whole_data['effectiveness']\n", + "Target=le().fit_transform(Target)\n", + "\n", + "Dat=''\n", + "for col in Features.columns: \n", + " Dat += Features[col].map(str) + ' '\n" + ] + }, + { + "cell_type": "code", + "execution_count": 51, + "metadata": {}, + "outputs": [], + "source": [ + "Text_tranform=CountVectorizer(analyzer='word', max_features=100, stop_words='english', binary=True).fit(Dat)\n", + "\n", + "Text_tranform.vocabulary_;\n", + "\n", + "Numerical_features=Text_tranform.transform(Dat)\n", + "Numerical_features=Numerical_features.toarray()\n", + "Data=pd.DataFrame(Numerical_features) \n", + "\n", + "#Data=pd.DataFrame(np.concatenate([rating.values.reshape(-1,1), Data], axis=1))\n", + "Data=pd.DataFrame(np.concatenate([Data, Target.reshape(-1,1)], axis=1))\n", + "\n", + "Data.head();\n" + ] + }, + { + "cell_type": "code", + "execution_count": 52, + "metadata": {}, + "outputs": [], + "source": [ + "Train_features, Test_features, Train_target, Test_target = train_test_split(Data.iloc[:, :-1],\\\n", + " Data.iloc[:, -1], test_size=0.4, random_state=0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "weights=np.ones((len(np.unique(Train_target)), 1+Train_features.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=100, lr=0.3)\n", + "\n", + "MultiLogReg.fit(Train_features, pd.Series(Train_target), weights)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of Multiclass Logistic Regression: 41.61640530759952%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "Predict=MultiLogReg.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Predict).sum()/len(Test_target)\n", + "print(\"Accuracy of Multiclass Logistic Regression: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "metadata": {}, + "outputs": [], + "source": [ + "NB=Naive_Bayes()\n", + "\n", + "NB.train(Train_features, pd.Series(Train_target))" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of my Bernoulli Naive Bayes: 39.56574185765983%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + 
"Pred=NB.predict(Test_features)\n", + "\n", + "accuracy=(Test_target==Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of my Bernoulli Naive Bayes: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "GDA_Model=GDAMulticlass(regularizer=0.1)\n", + "GDA_Model.train(pd.DataFrame(Train_features), pd.Series(Train_target, name='target'))" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of GDA: 42.5211097708082%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "GDA_Pred=GDA_Model.predict(pd.DataFrame(Test_features))\n", + "\n", + "accuracy=(Test_target==GDA_Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of GDA: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Comparison using the Iris data" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "metadata": {}, + "outputs": [], + "source": [ + "from sklearn import datasets\n", + "iris=datasets.load_iris()\n", + "\n", + "x=iris.data[:,:4]\n", + "y=(iris.target)" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "metadata": {}, + "outputs": [], + "source": [ + "x_train, x_test, y_train, y_test = train_test_split(x,\\\n", + " y, test_size=0.8, random_state=101)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 61, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "weights=np.zeros((len(np.unique(y)), 1+x.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=400, lr=0.2)\n", + "\n", + "MultiLogReg.fit(pd.DataFrame(x_train), pd.Series(y_train), weights)" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "Ypred=MultiLogReg.predict(x_test)" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'Accuracy of Logistic regression: 97.5%'" + ] + }, + "execution_count": 63, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "(\"Accuracy of Logistic regression: {}%\" .format(100*(Ypred==y_test).sum()/len(y_test)))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + 
"execution_count": 64, + "metadata": {}, + "outputs": [], + "source": [ + "NaiveB=Naive_Bayes()\n", + "NaiveB.train(pd.DataFrame(x_train), pd.Series(y_train))" + ] + }, + { + "cell_type": "code", + "execution_count": 65, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "Y1pred=NaiveB.predict(pd.DataFrame(x_test))" + ] + }, + { + "cell_type": "code", + "execution_count": 66, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of Naive Bayes: 35.833333333333336%\n" + ] + } + ], + "source": [ + "print('Accuracy of Naive Bayes: {}%' .format (100*(Y1pred==y_test).sum()/len(y_test)))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 67, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "GDA2=GDAMulticlass()\n", + "GDA2.train(pd.DataFrame(x_train), pd.Series(y_train, name='target'))" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]\n" + ] + } + ], + "source": [ + "Y2Pred=GDA2.predict(pd.DataFrame(x_test))" + ] + }, + { + "cell_type": "code", + "execution_count": 69, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of GDA: 98.33333333333333%\n" + ] + } + ], + "source": [ + "print(\"Accuracy of GDA: {}%\" .format(100*(Y2Pred==y_test).sum()/len(y_test)))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### We download another data to compare the three models." + ] + }, + { + "cell_type": "code", + "execution_count": 70, + "metadata": {}, + "outputs": [], + "source": [ + "#!wget https://storage.googleapis.com/dataset-uploader/bbc/bbc-text.csv" + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
categorytext
0techtv future in the hands of viewers with home th...
1businessworldcom boss left books alone former worldc...
2sporttigers wary of farrell gamble leicester say ...
3sportyeading face newcastle in fa cup premiership s...
4entertainmentocean s twelve raids box office ocean s twelve...
\n", + "
" + ], + "text/plain": [ + " category text\n", + "0 tech tv future in the hands of viewers with home th...\n", + "1 business worldcom boss left books alone former worldc...\n", + "2 sport tigers wary of farrell gamble leicester say ...\n", + "3 sport yeading face newcastle in fa cup premiership s...\n", + "4 entertainment ocean s twelve raids box office ocean s twelve..." + ] + }, + "execution_count": 71, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Text=pd.read_csv(\"bbc-text.csv\")\n", + "Text.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 72, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'tv future in the hands of viewers with home theatre systems plasma high-definition tvs and digital video recorders moving into the living room the way people watch tv will be radically different in five years time. that is according to an expert panel which gathered at the annual consumer electronics show in las vegas to discuss how these new technologies will impact one of our favourite pastimes. with the us leading the trend programmes and other content will be delivered to viewers via home networks through cable satellite telecoms companies and broadband service providers to front rooms and portable devices. one of the most talked-about technologies of ces has been digital and personal video recorders (dvr and pvr). these set-top boxes like the us s tivo and the uk s sky+ system allow people to record store play pause and forward wind tv programmes when they want. essentially the technology allows for much more personalised tv. they are also being built-in to high-definition tv sets which are big business in japan and the us but slower to take off in europe because of the lack of high-definition programming. not only can people forward wind through adverts they can also forget about abiding by network and channel schedules putting together their own a-la-carte entertainment. but some us networks and cable and satellite companies are worried about what it means for them in terms of advertising revenues as well as brand identity and viewer loyalty to channels. although the us leads in this technology at the moment it is also a concern that is being raised in europe particularly with the growing uptake of services like sky+. what happens here today we will see in nine months to a years time in the uk adam hume the bbc broadcast s futurologist told the bbc news website. for the likes of the bbc there are no issues of lost advertising revenue yet. it is a more pressing issue at the moment for commercial uk broadcasters but brand loyalty is important for everyone. we will be talking more about content brands rather than network brands said tim hanlon from brand communications firm starcom mediavest. the reality is that with broadband connections anybody can be the producer of content. he added: the challenge now is that it is hard to promote a programme with so much choice. what this means said stacey jolna senior vice president of tv guide tv group is that the way people find the content they want to watch has to be simplified for tv viewers. it means that networks in us terms or channels could take a leaf out of google s book and be the search engine of the future instead of the scheduler to help people find what they want to watch. this kind of channel model might work for the younger ipod generation which is used to taking control of their gadgets and what they play on them. but it might not suit everyone the panel recognised. 
older generations are more comfortable with familiar schedules and channel brands because they know what they are getting. they perhaps do not want so much of the choice put into their hands mr hanlon suggested. on the other end you have the kids just out of diapers who are pushing buttons already - everything is possible and available to them said mr hanlon. ultimately the consumer will tell the market they want. of the 50 000 new gadgets and technologies being showcased at ces many of them are about enhancing the tv-watching experience. high-definition tv sets are everywhere and many new models of lcd (liquid crystal display) tvs have been launched with dvr capability built into them instead of being external boxes. one such example launched at the show is humax s 26-inch lcd tv with an 80-hour tivo dvr and dvd recorder. one of the us s biggest satellite tv companies directtv has even launched its own branded dvr at the show with 100-hours of recording capability instant replay and a search function. the set can pause and rewind tv for up to 90 hours. and microsoft chief bill gates announced in his pre-show keynote speech a partnership with tivo called tivotogo which means people can play recorded programmes on windows pcs and mobile devices. all these reflect the increasing trend of freeing up multimedia so that people can watch what they want when they want.'" + ] + }, + "execution_count": 72, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Text.text[0]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": {}, + "outputs": [], + "source": [ + "Text_tranformer=CountVectorizer(analyzer='word', max_features=400, binary=True).fit(Text['text'])\n", + "\n", + "bow1=Text_tranformer.transform(Text['text'])" + ] + }, + { + "cell_type": "code", + "execution_count": 75, + "metadata": {}, + "outputs": [], + "source": [ + "Data=pd.DataFrame(data=bow1.toarray())\n", + "Data.head()\n", + "Text['category']=le().fit_transform(Text['category'])\n", + "Data['target']=Text['category']" + ] + }, + { + "cell_type": "code", + "execution_count": 76, + "metadata": {}, + "outputs": [], + "source": [ + "Train_features, Test_features, Train_target, Test_target = train_test_split(Data.iloc[:, :-1],\\\n", + " Data.iloc[:, -1], test_size=0.4, random_state=101)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Multiclass\\ Logistic\\ Regression}$" + ] + }, + { + "cell_type": "code", + "execution_count": 77, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "weights=np.ones((len(np.unique(Train_target)), 1+Train_features.shape[1]))\n", + "\n", + "MultiLogReg=MulticlassLogReg(Max_iter=100, lr=0.2)\n", + "\n", + "MultiLogReg.fit(Train_features, Train_target, weights)" + ] + }, + { + "cell_type": "code", + "execution_count": 78, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of the Logistic-Regression: 93.14606741573034\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + 
"source": [ + "Predict=MultiLogReg.predict(Test_features)\n", + "AccuracyLogRegression=(Predict==Test_target).sum()/(len(Test_target))\n", + "print(\"Accuracy of the Logistic-Regression: \", AccuracyLogRegression*100)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Bernoulli\\ Naive\\ Bayes}$" + ] + }, + { + "cell_type": "code", + "execution_count": 79, + "metadata": {}, + "outputs": [], + "source": [ + "NB=Naive_Bayes()\n", + "\n", + "NB.train(Train_features, Train_target)" + ] + }, + { + "cell_type": "code", + "execution_count": 80, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy Naive Bayes: 86.62921348314607%\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "Pred=NB.predict(Test_features)\n", + "\n", + "accuracy=(np.array(Test_target)==Pred).sum()/len(Test_target)\n", + "print(\"Accuracy Naive Bayes: {}%\".format(100*accuracy))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "$\\color{blue}{Gaussian\\ Discriminant\\ Analysis}$" + ] + }, + { + "cell_type": "code", + "execution_count": 81, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " training: [=======================================100.0%=======================================]\n" + ] + } + ], + "source": [ + "MulticlassGDA=GDAMulticlass()\n", + "\n", + "MulticlassGDA.train(Train_features, Train_target)" + ] + }, + { + "cell_type": "code", + "execution_count": 82, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + " predictions: [=====================================100.0%======================================]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Accuracy of the GDA: 93.37078651685393\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "GDA_Pred=MulticlassGDA.predict(Test_features)\n", + "\n", + "AccuracyGDA=(np.array(Test_target)==GDA_Pred).sum()/len(Test_target)\n", + "print(\"Accuracy of the GDA: \", AccuracyGDA*100)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## $\\color{green}{\\text{Report}}$" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The three algorithms GDA, Naive Bayes and Softmax Logistic Regression were compared on three different data sets: 'drugLib_raw.tsv', Iris data set and 'bbc-text.csv'.\n", + "The comparison on the first data set 'drugLib_raw.tsv' was done in four steps: comparison on $10\\%$, $30\\%$, $60\\%$ and finally on $100\\%$ of the data. On these four comparisons, GDA appeared to be the most accurate (even though the accuracy was around $45\\%$ in average), followed very closely by Softmax Logistic Rgression. But it is important to underline that Naive Bayes and GDA are very fast (during the training process) as compared to Softmax Logistic Regression. This is due to the fact that GDA and Naive Bayes are both generative models and don't require any learning algorithm, their parameters are directly computed, no update required. 
+    "On the other hand, the low accuracy of all three algorithms on this data set is probably due to the fact that the chosen features are not predictive enough for the chosen target.\n",
+    "\n",
+    "\n",
+    "\n",
+    "On the Iris data set (a small data set), very good accuracy was observed, but only for two of the three algorithms. Again, GDA and Softmax Logistic Regression were the best ($98.33\\%$ vs $97.5\\%$), whereas Naive Bayes reached only $35.83\\%$ accuracy. The failure of Naive Bayes (more precisely, Bernoulli Naive Bayes) on this example is due to the fact that the Iris features are not binary.\n",
+    "\n",
+    "On the third data set, which is about as large as the first one, all three algorithms reached good accuracy. Here, Softmax Logistic Regression was slightly less accurate than GDA ($93.15\\%$ vs $93.37\\%$), and Naive Bayes scored $86.63\\%$.\n",
+    "\n",
+    "\n",
+    "In conclusion, each of the three algorithms has its strengths, and the best choice depends on the data under investigation. The two generative models, GDA and Naive Bayes, are fast but can give poor results when the (strong) assumptions they rest on are not met. On the other hand, Softmax Logistic Regression takes longer to train, but it is more robust: it makes fewer assumptions and handles both binary and non-binary features."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.7.3"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
diff --git a/.ipynb_checkpoints/My_binary_search_from_scratch-checkpoint.ipynb b/.ipynb_checkpoints/My_binary_search_from_scratch-checkpoint.ipynb
new file mode 100644
index 0000000..5ad1bbf
--- /dev/null
+++ b/.ipynb_checkpoints/My_binary_search_from_scratch-checkpoint.ipynb
@@ -0,0 +1,115 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Length of the current array: 12\n",
+      "Length of the current array: 6\n",
+      "Length of the current array: 2\n",
+      "Length of the current array: 1\n",
+      "\n",
+      "-1\n",
+      "\n",
+      "Length of the current array: 12\n",
+      "Length of the current array: 5\n",
+      "Length of the current array: 2\n",
+      "\n",
+      "8\n"
+     ]
+    }
+   ],
+   "source": [
+    "\"\"\"You're going to write a binary search function.\n",
+    "You should use an iterative approach - meaning\n",
+    "using loops.\n",
+    "Your function should take two inputs:\n",
+    "a Python list to search through, and the value\n",
+    "you're searching for.\n",
+    "Assume the list only has distinct elements,\n",
+    "meaning there are no repeated values, and\n",
+    "elements are in a strictly increasing order.\n",
+    "Return the index of value, or -1 if the value\n",
+    "doesn't exist in the list.\"\"\"\n",
+    "import numpy as np\n",
+    "\n",
+    "def binary_search_helper(input_array):\n",
+    "    \"\"\"Return the center index of input_array and whether its length is even.\"\"\"\n",
+    "    n=len(input_array)\n",
+    "    even=False\n",
+    "    if n%2==0:\n",
+    "        center=n//2\n",
+    "        even=True\n",
+    "    else:\n",
+    "        center=(n-1)//2\n",
+    "    return center, even\n",
+    "\n",
+    "def binary_search(input_array_, value):\n",
+    "    input_array=input_array_.copy()\n",
+    "    index=-1\n",
+    "    Search=True\n",
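+    "    # probe the middle element first; 'position' tracks the probe's absolute index in the original list\n",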
+    "    center=binary_search_helper(input_array)[0]\n",
+    "    position=center\n",
+    "    while(index==-1 and Search):\n",
+    "        print(\"Length of the current array:\",len(input_array))\n",
+    "        if input_array[center]>value:\n",
+    "            # search the left half of the current window\n",
+    "            input_array=input_array[:center]\n",
+    "            center, even_left=binary_search_helper(input_array)\n",
+    "            if even_left:\n",
+    "                position -= center\n",
+    "            else:\n",
+    "                position -= center+1\n",
+    "        elif input_array[center]<value:\n",
+    "            # search the right half; it starts just after the old center\n",
+    "            input_array=input_array[center+1:]\n",
+    "            center, even_right=binary_search_helper(input_array)\n",
+    "            position += center+1\n",
+    "        else:\n",
+    "            index=position\n",
+    "        if len(input_array)==0:\n",
+    "            Search=False\n",
+    "    print()\n",
+    "    return index\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def plusOne(digits):\n",
+    "    # LeetCode 'Plus One': increment the integer whose decimal digits are given as a list\n",
+    "    digits[-1] += 1\n",
+    "    i = -1\n",
+    "    # propagate the carry from the last digit towards the first\n",
+    "    while i > -len(digits):\n",
+    "        if digits[i] == 10:\n",
+    "            digits[i] = 0\n",
+    "            digits[i-1] += 1\n",
+    "            i -= 1\n",
+    "        if digits[i] != 10:\n",
+    "            break\n",
+    "    if digits[0] == 10:\n",
+    "        # str(10) -> \"1 0\" -> [\"1\", \"0\"]: a carry out of the leading digit splits 10 into 1 and 0\n",
+    "        digits = [int(\" \".join(str(digits[0])).split()[0]), int(\" \".join(str(digits[0])).split()[1])] + digits[1:]\n",
+    "    return digits\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "Dig = [1,9,9]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[2, 0, 0]"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "plusOne(Dig)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def findDiagonalOrder(matrix):\n",
+    "    # LeetCode 'Diagonal Traverse': walk the anti-diagonals, alternating direction\n",
+    "    if len(matrix) == 0:\n",
+    "        return []\n",
+    "    else:\n",
+    "        N, M = len(matrix), len(matrix[0])\n",
+    "        Traversal = []\n",
+    "        Down = False\n",
+    "        for n in range(N+M-1):\n",
+    "            if Down:\n",
+    "                for c in range(n+1):\n",
+    "                    if c >= N or n-c >= M:\n",
+    "                        continue\n",
+    "                    Traversal.append(matrix[c][n-c])\n",
+    "            else:\n",
+    "                for c in range(n+1)[::-1]:\n",
+    "                    if c >= N or n-c >= M:\n",
+    "                        continue\n",
+    "                    Traversal.append(matrix[c][n-c])\n",
+    "            Down = not Down\n",
+    "        return Traversal"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "M=np.array([[2,3,-6,1], [39,-2,9.7, 3], [11,9,34, 100]])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[2.0, 3.0, 39.0, 11.0, -2.0, -6.0, 1.0, 9.7, 9.0, 34.0, 3.0, 100.0]"
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "findDiagonalOrder(M)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def longestCommonPrefix(strs):\n",
+    "    if strs == [] or strs == [\"\"]:\n",
+    "        return \"\"\n",
+    "    if len(strs) == 1:\n",
+    "        return strs[0]\n",
+    "    prefix = \"\"\n",
+    "    position = 0\n",
+    "    while True:\n",
+    "        if strs[0] == \"\":\n",
+    "            return \"\"\n",
+    "        item0 = strs[0]\n",
+    "        if position < len(item0):\n",
+    "            character = item0[position]\n",
+    "            for item in strs:\n",
+    "                if item == \"\":\n",
+    "                    return \"\"\n",
+    "                if position >= len(item) or item[position] != character:\n",
+    "                    return prefix\n",
+    "            prefix += character\n",
+    "            position += 1\n",
+    "        else:\n",
+    "            # strs[0] is exhausted, so it is itself the common prefix\n",
+    "            return prefix"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def twoSum1(numbers, target):\n",
+    "    # one pass with a hash map: remember each value's index and look up the complement\n",
+    "    D={}\n",
+    "    for i in range(len(numbers)):\n",
+    "        if target - numbers[i] in D:\n",
+    "            return [D[target - numbers[i]]+1, i+1]\n",
+    "        D[numbers[i]]=i"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
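+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Added note (sketch): twoSum1 above makes one pass with a hash map, using O(n) extra memory.\n",
+    "# twoSum2 below instead walks two indices over the input, assuming it is sorted in increasing\n",
+    "# order (as in the test further down), and uses only O(1) extra memory.\n",
+    "# Both return 1-based index pairs.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+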
"metadata": {}, + "outputs": [], + "source": [ + "def twoSum2(numbers, target):\n", + " i = 0\n", + " j = i+1\n", + " while numbers[i] + numbers[j] != target:\n", + " while numbers[i] + numbers[j] < target:\n", + " if j < len(numbers)-1:\n", + " j += 1\n", + " else:\n", + " break\n", + " if numbers[i] + numbers[j] == target:\n", + " return [i+1, j+1]\n", + " i += 1\n", + " j = i+1\n", + " return [i+1, j+1]" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [], + "source": [ + "numbers = [-19,-10,4,389,394,419,429,529,576,618,619,714,802,1113,4223,6789]\n", + "target = 6779" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[2, 16]" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "twoSum1(numbers, target)" + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[2, 16]" + ] + }, + "execution_count": 24, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "twoSum2(numbers, target)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.6" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +}