|
20 | 20 | "metadata": {},
|
21 | 21 | "outputs": [],
|
22 | 22 | "source": [
|
23 |
| - "# In Python, module can be imported by a command similar to 'import numpy as np'. \n", |
24 |
| - "# It is a good practice to maintain a section at the beginning of the notebook to import all necessary modules.\n", |
| 23 | + "# in Python, module can be imported by a command similar to 'import numpy as np'. \n", |
| 24 | + "# it is a good practice to maintain a section at the beginning of the notebook to import all necessary modules.\n", |
25 | 25 | "# for new module, could use pip to install it. \n",
|
26 | 26 | "# for example 'pip install numpy'\n",
|
27 | 27 | "import numpy as np\n",
|
|
110 | 110 | "metadata": {},
|
111 | 111 | "outputs": [],
|
112 | 112 | "source": [
|
113 |
| - "# Use dir() to get a list of all the attributes an object has\n", |
| 113 | + "# use dir() to get a list of all the attributes an object has\n", |
114 | 114 | "dir(lm)"
|
115 | 115 | ]
|
116 | 116 | },
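A minimal sketch of the kind of attributes dir(lm) lists, assuming lm is the fitted statsmodels OLS result used elsewhere in the notebook:

    # a few of the attributes dir(lm) surfaces on a fitted OLS result
    print(lm.params)      # estimated coefficients
    print(lm.pvalues)     # p-values for each coefficient
    print(lm.rsquared)    # R-squared of the fit
    print(lm.conf_int())  # 95% confidence intervals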
|
|
190 | 190 | "metadata": {},
|
191 | 191 | "outputs": [],
|
192 | 192 | "source": [
|
193 |
| - "# As mentioned above. For machine learning models, sklearn is the most common used module, but sklearn is a little bit less on statistics.\n", |
| 193 | + "# as mentioned above. For machine learning models, sklearn is the most common used module, but sklearn is a little bit less on statistics.\n", |
194 | 194 | "x = pd.DataFrame(Boston.lstat)\n",
|
195 | 195 | "y = Boston.medv\n",
|
196 | 196 | "print(x.shape)\n",
|
|
235 | 235 | "metadata": {},
|
236 | 236 | "outputs": [],
|
237 | 237 | "source": [
|
238 |
| - "# If we want to use all the variable. We can use the following trick to manually construct the list. In Python, most of time, you have to manully construct the variable list.\n", |
| 238 | + "# if we want to use all the variable. We can use the following trick to manually construct the list. In Python, most of time, you have to manully construct the variable list.\n", |
239 | 239 | "all_columns = \"+\".join(Boston.columns.difference([\"medv\"]))\n",
|
240 | 240 | "my_formula = \"medv~\" + all_columns\n",
|
241 | 241 | "lm = smf.ols(my_formula, data=Boston).fit()\n",
|
|
345 | 345 | "metadata": {},
|
346 | 346 | "outputs": [],
|
347 | 347 | "source": [
|
348 |
| - "# There is anova function built in already in statsmodels. \n", |
349 |
| - "# If you know what to do, use the key words to google it and likely you will find a very good answer. \n", |
350 |
| - "# Here we compare the models with one order of stat and two orders of stats. \n", |
351 |
| - "# By looking at the p value that will reject the null hypothesis that the coefficent of lstat**2 equals 0.\n", |
| 348 | + "# there is anova function built in already in statsmodels. \n", |
| 349 | + "# if you know what to do, use the key words to google it and likely you will find a very good answer. \n", |
| 350 | + "# here we compare the models with one order of stat and two orders of stats. \n", |
| 351 | + "# by looking at the p value that will reject the null hypothesis that the coefficent of lstat**2 equals 0.\n", |
352 | 352 | "table = sm.stats.anova_lm(lm_order1, lm_order2)\n",
|
353 | 353 | "print(table)"
|
354 | 354 | ]
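A sketch of how the two models being compared could have been fit; the names lm_order1 and lm_order2 come from the cell above, while the I(lstat**2) term is an assumption about how the quadratic model was specified:

    import statsmodels.api as sm
    import statsmodels.formula.api as smf
    # first-order and second-order fits of medv on lstat
    lm_order1 = smf.ols('medv ~ lstat', data=Boston).fit()
    lm_order2 = smf.ols('medv ~ lstat + I(lstat**2)', data=Boston).fit()
    # F-test: does the quadratic term significantly improve the fit?
    print(sm.stats.anova_lm(lm_order1, lm_order2))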
|
|
456 | 456 | "metadata": {},
|
457 | 457 | "outputs": [],
|
458 | 458 | "source": [
|
459 |
| - "# Then the model buliding will be the same with all numerrical variables.\n", |
| 459 | + "# then the model buliding will be the same with all numerrical variables.\n", |
460 | 460 | "lm_carseats_dummy = smf.ols('Sales ~ Income + Advertising + Price + Age + ShelveLoc_Good + ShelveLoc_Medium', \n",
|
461 | 461 | " data = Carseats_dummy).fit()"
|
462 | 462 | ]
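A sketch of how Carseats_dummy with the ShelveLoc_Good and ShelveLoc_Medium columns could be constructed; pd.get_dummies and dropping the 'Bad' baseline level are assumptions, not necessarily the notebook's exact cell:

    import pandas as pd
    # one-hot encode ShelveLoc; drop_first removes the 'Bad' baseline level,
    # leaving ShelveLoc_Good and ShelveLoc_Medium for the formula above
    Carseats_dummy = pd.get_dummies(Carseats, columns=['ShelveLoc'], drop_first=True)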
|
|
467 | 467 | "metadata": {},
|
468 | 468 | "outputs": [],
|
469 | 469 | "source": [
|
470 |
| - "# The interpretation of the coefficients are holding everything fixed, Medium shelve location is associated with an average\n", |
| 470 | + "# the interpretation of the coefficients are holding everything fixed, Medium shelve location is associated with an average\n", |
471 | 471 | "# increase of sale around 2.0046. \n",
|
472 | 472 | "lm_carseats_dummy.summary() "
|
473 | 473 | ]
|
|
499 | 499 | "metadata": {},
|
500 | 500 | "outputs": [],
|
501 | 501 | "source": [
|
502 |
| - "# Let us write a simple function to print current time. \n", |
503 |
| - "# The key word in Python for user defined function is 'def'. \n", |
504 |
| - "# Pay attention to the ':'. The difference betwwen R (others) and Python is that Python \n", |
| 502 | + "# let us write a simple function to print current time. \n", |
| 503 | + "# yhe key word in Python for user defined function is 'def'. \n", |
| 504 | + "# pay attention to the ':'. The difference betwwen R (others) and Python is that Python \n", |
505 | 505 | "# forces you to obey its indentation rules. For example, the following function won't work because of the extra space in front of 'print'.\n",
|
506 | 506 | "def print_current_time_wrong():\n",
|
507 | 507 | " from datetime import datetime # this is very bad practice !!! \n",
|
|
559 | 559 | "name": "python",
|
560 | 560 | "nbconvert_exporter": "python",
|
561 | 561 | "pygments_lexer": "ipython3",
|
562 |
| - "version": "3.5.6" |
| 562 | + "version": "3.6.2" |
563 | 563 | }
|
564 | 564 | },
|
565 | 565 | "nbformat": 4,
|
|