take linear algebra to its own file

gkarwchan · gkarwchan · commit 9a319a93967c · 2019-11-20T20:41:49.000-07:00
diff --git a/Calgary Census.ipynb b/Calgary Census.ipynb
@@ -370,7 +370,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.0"
+   "version": "3.6.8"
   }
  },
  "nbformat": 4,
diff --git a/Linear Algebra.ipynb b/Linear Algebra.ipynb
@@ -0,0 +1,151 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Linear Algebra In Supervised Learning:  \n",
+    "\n",
+    "Linear Algebra is the basis of building models in machine learning.  \n",
+    "A very simple example:  \n",
+    "\n",
+    "Predict a house's price from its size:\n",
+    "\n",
+    "Create a math function called **Hypothesis** to predict the price of the house.\n",
+    "\n",
+    "\\begin{align}\n",
+    "\\Large\n",
+    "y^i = h_\\theta(x^i) & = \\theta_0 + \\theta_1 x^i \\\\\n",
+    "\\end{align}\n",
+    "\n",
+    "\n",
+    "Linear algebra is used as the basis of the math in any machine learning algorithm.  \n",
+    "\n",
+    "The above formula is for a single input variable.  \n",
+    "But what if we have multiple input variables?  \n",
+    "\n",
+    "\\begin{align}\n",
+    "\\Large\n",
+    "y^i = h_\\theta(x_1^i, x_2^i, ...) & = \\theta_0 + \\theta_1 x_1^i + \\theta_2 x_2^i + ... \\\\\n",
+    "\\end{align}\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Practical Example: Use Matrix calculation in Supervised Learning\n",
+    "\n",
+    "\n",
+    "![Matrix calc](img/LA-26.png)\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Iris dataset in Scikit-learn module:\n",
+    "scikit-learn comes with a few standard datasets, and iris is one of them.  \n",
+    "It is already formatted so that it can be used directly by machine learning algorithms.   "
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "type of iris:  <class 'sklearn.utils.Bunch'>\n",
+      "dict keys:  dict_keys(['data', 'target', 'target_names', 'DESCR', 'feature_names', 'filename'])\n",
+      "type of iris data:  <class 'numpy.ndarray'>\n",
+      "iris column names:  ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)']\n",
+      "the target:  [0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n",
+      " 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1\n",
+      " 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2 2 2\n",
+      " 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2\n",
+      " 2 2]\n"
+     ]
+    }
+   ],
+   "source": [
+    "from sklearn import datasets\n",
+    "iris_sk = datasets.load_iris()\n",
+    "print ('type of iris: ', type(iris_sk))\n",
+    "print ('dict keys: ' , iris_sk.keys())\n",
+    "print ('type of iris data: ', type(iris_sk.data))\n",
+    "print ('iris column names: ' , iris_sk.feature_names)\n",
+    "print ('the target: ', iris_sk.target)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "\n",
+    "X = np.asmatrix(iris_sk.data)\n",
+    "\n",
+    "x = np.transpose(X)\n",
+    "\n",
+    "T = x.dot(X)\n",
+    "\n",
+    "inv = np.linalg.inv(T)\n",
+    "\n",
+    "theta = (inv.dot(X.T)).dot(iris_sk.target)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "matrix([[-0.0844926 , -0.02356211,  0.22487123,  0.59972247]])"
+      ]
+     },
+     "execution_count": 3,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "theta"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.8"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
diff --git a/more on pandas statistics.ipynb b/more on pandas statistics.ipynb
@@ -63,106 +63,6 @@
     "# resampled=data.resample('A')\n",
     "# resampled.plot()"
    ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 2,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from datetime import datetime as dt\n",
-    "import mpl_finance"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 8,
-   "metadata": {},
-   "outputs": [
-    {
-     "ename": "AttributeError",
-     "evalue": "module 'mpl_finance' has no attribute 'quotes_historical_yahoo_ochl'",
-     "output_type": "error",
-     "traceback": [
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
-      "\u001b[0;31mAttributeError\u001b[0m                            Traceback (most recent call last)",
-      "\u001b[0;32m<ipython-input-8-bfdf1a64e1da>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m      3\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m \u001b[0msymbol\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m\"EWN\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 5\u001b[0;31m quotes = mpl_finance.quotes_historical_yahoo_ochl(symbol, start,\n\u001b[0m\u001b[1;32m      6\u001b[0m end, asobject=True)\n",
-      "\u001b[0;31mAttributeError\u001b[0m: module 'mpl_finance' has no attribute 'quotes_historical_yahoo_ochl'"
-     ]
-    }
-   ],
-   "source": [
-    "start = dt(1996, 3, 22) \n",
-    "end = dt(2013, 5, 4)\n",
-    "\n",
-    "symbol = \"EWN\"\n",
-    "quotes = mpl_finance.quotes_historical_yahoo_ochl(symbol, start,\n",
-    "end, asobject=True)\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 7,
-   "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "['Affine2D',\n",
-       " 'Line2D',\n",
-       " 'LineCollection',\n",
-       " 'PolyCollection',\n",
-       " 'Rectangle',\n",
-       " 'TICKLEFT',\n",
-       " 'TICKRIGHT',\n",
-       " '__builtins__',\n",
-       " '__cached__',\n",
-       " '__doc__',\n",
-       " '__file__',\n",
-       " '__loader__',\n",
-       " '__name__',\n",
-       " '__package__',\n",
-       " '__spec__',\n",
-       " '_candlestick',\n",
-       " '_check_input',\n",
-       " '_plot_day_summary',\n",
-       " 'absolute_import',\n",
-       " 'candlestick2_ochl',\n",
-       " 'candlestick2_ohlc',\n",
-       " 'candlestick_ochl',\n",
-       " 'candlestick_ohlc',\n",
-       " 'division',\n",
-       " 'index_bar',\n",
-       " 'mcolors',\n",
-       " 'np',\n",
-       " 'plot_day_summary2_ochl',\n",
-       " 'plot_day_summary2_ohlc',\n",
-       " 'plot_day_summary_oclh',\n",
-       " 'plot_day_summary_ohlc',\n",
-       " 'print_function',\n",
-       " 'unicode_literals',\n",
-       " 'volume_overlay',\n",
-       " 'volume_overlay2',\n",
-       " 'volume_overlay3',\n",
-       " 'xrange',\n",
-       " 'zip']"
-      ]
-     },
-     "execution_count": 7,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "dir (mpl_finance)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
   }
  ],
  "metadata": {
@@ -181,7 +81,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.7.0"
+   "version": "3.6.8"
   }
  },
  "nbformat": 4,

Original file line number	Diff line number	Diff line change
`@@ -370,7 +370,7 @@`
`370`	`370`	`"name": "python",`
`371`	`371`	`"nbconvert_exporter": "python",`
`372`	`372`	`"pygments_lexer": "ipython3",`
`373`		`- "version": "3.7.0"`
	`373`	`+ "version": "3.6.8"`
`374`	`374`	`}`
`375`	`375`	`},`
`376`	`376`	`"nbformat": 4,`