Finished viterbi

Kosaro · Kosaro · commit caf666c56000 · 2020-11-12T23:25:32.000-05:00
diff --git a/HMM.ipynb b/HMM.ipynb
@@ -23,7 +23,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 118,
+   "execution_count": 87,
    "outputs": [],
    "source": [
     "import numpy as np\n",
@@ -52,7 +52,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 119,
+   "execution_count": 88,
    "outputs": [],
    "source": [
     "def get_pb1():\n",
@@ -73,6 +73,39 @@
     }
    }
   },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "#### Emission"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 89,
+   "outputs": [],
+   "source": [
+    "def fair_die_emission():\n",
+    "    return 1/6\n",
+    "\n",
+    "def loaded_die_emission(value):\n",
+    "    if value == 6:\n",
+    "        return .5\n",
+    "    else:\n",
+    "        return .1\n",
+    "\n",
+    "def emission(value):\n",
+    "    return np.asarray((fair_die_emission(), loaded_die_emission(value)))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
   {
    "cell_type": "markdown",
    "source": [
@@ -86,7 +119,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 120,
+   "execution_count": 90,
    "outputs": [
     {
      "name": "stdout",
@@ -108,18 +141,6 @@
     }
    ],
    "source": [
-    "def fair_die_emission():\n",
-    "    return 1/6\n",
-    "\n",
-    "def loaded_die_emission(value):\n",
-    "    if value == 6:\n",
-    "        return .5\n",
-    "    else:\n",
-    "        return .1\n",
-    "\n",
-    "def emission(value):\n",
-    "    return np.asarray((fair_die_emission(), loaded_die_emission(value)))\n",
-    "\n",
     "def viterbi(sequence):\n",
     "    a = np.asarray([[.95,.05],[.05,.95]]) # transition probability\n",
     "    b = emission(sequence[0]) # Emission probability\n",
@@ -163,31 +184,160 @@
    }
   },
   {
-   "cell_type": "markdown",
+   "cell_type": "code",
+   "execution_count": 91,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "0.39891275119173036\n"
+     ]
+    }
+   ],
    "source": [
-    "2. Download the dataset hmm_pb2.csv from Canvas. It represents a sequence of\n",
-    "10000 dice rolls x from the Dishonest casino model but with other values for the a and\n",
-    "b parameters than those from class. Having so many observations, you are going to\n",
-    "learn the model parameters.\n"
+    "def forward(sequence, normalize=False):\n",
+    "    \"\"\"Run the HMM forward algorithm for the two-state dishonest-casino model.\n",
+    "\n",
+    "    State 0 is the fair die and state 1 the loaded die (the order returned by\n",
+    "    emission()). The start distribution is uniform and the probability of\n",
+    "    switching dice between two rolls is 0.05.\n",
+    "\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    sequence : numpy.ndarray\n",
+    "        1-D array of observed die values.\n",
+    "    normalize : bool, optional\n",
+    "        If True, rescale every row to sum to 1 so the recursion cannot\n",
+    "        underflow on long sequences; ratios within a row are unaffected.\n",
+    "        The default (False) returns the unscaled joint probabilities.\n",
+    "\n",
+    "    Returns\n",
+    "    -------\n",
+    "    numpy.ndarray\n",
+    "        Array of shape (sequence.size, 2); row t holds alpha_t for both states.\n",
+    "        An empty sequence yields an empty (0, 2) array.\n",
+    "    \"\"\"\n",
+    "    tran = np.asarray([[.95,.05],[.05,.95]]) # tran[i, j] = P(next state j | current state i)\n",
+    "    start = np.asarray((.5,.5)) # Start probability\n",
+    "    alpha = np.empty((sequence.size, 2))\n",
+    "    if sequence.size == 0:\n",
+    "        return alpha\n",
+    "    alpha[0] = emission(sequence[0]) * start\n",
+    "    if normalize:\n",
+    "        alpha[0] /= alpha[0].sum()\n",
+    "    for t in range(1, sequence.size):\n",
+    "        # alpha_t(j) = b_j(x_t) * sum_i alpha_{t-1}(i) * tran[i, j]\n",
+    "        # (row vector times matrix, so it stays correct for a non-symmetric tran)\n",
+    "        alpha[t] = emission(sequence[t]) * (alpha[t-1] @ tran)\n",
+    "        if normalize:\n",
+    "            alpha[t] /= alpha[t].sum()\n",
+    "    return alpha\n",
+    "\n",
+    "a = forward(get_pb1())\n",
+    "print(a[124,0]/a[124,1])"
    ],
    "metadata": {
-    "collapsed": false
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 137,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "3.856448201261194\n"
+     ]
+    }
+   ],
+   "source": [
+    "def backward(sequence):\n",
+    "    \"\"\"Run the HMM backward algorithm for the two-state dishonest-casino model.\n",
+    "\n",
+    "    Uses the same transition matrix as forward(). Every row except the last is\n",
+    "    rescaled to sum to 1 right after it is computed, so the values can neither\n",
+    "    underflow nor overflow on long sequences. Only the ratio between the two\n",
+    "    states within a row is therefore meaningful.\n",
+    "\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    sequence : numpy.ndarray\n",
+    "        1-D array of observed die values.\n",
+    "\n",
+    "    Returns\n",
+    "    -------\n",
+    "    numpy.ndarray\n",
+    "        Array of shape (sequence.size, 2); row t is proportional to beta_t.\n",
+    "        The last row is all ones. An empty sequence yields an empty (0, 2) array.\n",
+    "    \"\"\"\n",
+    "    tran = np.asarray([[.95,.05],[.05,.95]]) # tran[i, j] = P(next state j | current state i)\n",
+    "    beta = np.empty((sequence.size, 2))\n",
+    "    if sequence.size == 0:\n",
+    "        return beta\n",
+    "    beta[-1] = 1.0\n",
+    "    for t in range(sequence.size-2, -1, -1):\n",
+    "        # beta_t(i) = sum_j tran[i, j] * b_j(x_{t+1}) * beta_{t+1}(j)\n",
+    "        beta[t] = tran @ (emission(sequence[t+1]) * beta[t+1])\n",
+    "        beta[t] /= beta[t].sum() # per-row normalisation to avoid underflow\n",
+    "    return beta\n",
+    "\n",
+    "B = backward(get_pb1())\n",
+    "print(B[124,0]/B[124,1])"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
    }
   },
   {
    "cell_type": "markdown",
    "source": [
+    "2. Download the dataset hmm_pb2.csv from Canvas. It represents a sequence of\n",
+    "10000 dice rolls x from the Dishonest casino model but with other values for the a and\n",
+    "b parameters than those from class. Having so many observations, you are going to\n",
+    "learn the model parameters.\n",
+    "\n",
     "Implement and run the Baum-Welch algorithm using the forward and backward\n",
     "algorithms that you already implemented for Pb 1. You can initialize the $\\pi,a,b$ with\n",
     "your guess, or with some random probabilities (make sure that $\\pi$ sums to 1 and that\n",
     "$a_{ij}, b^i_k$\n",
     "sum to 1 for each $i$). The algorithm converges quite slowly, so you might need\n",
     "to run it for up to 1000 iterations or more for the parameters to converge.\n",
-    "Report the values of $\\pi,a,b$ that you have obtained. (4 points)\n",
-    "\n"
+    "Report the values of $\\pi,a,b$ that you have obtained. (4 points)\n"
    ],
    "metadata": {
-    "collapsed": false
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 151,
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "c:\\users\\okosa\\pycharmprojects\\regressionasignment\\venv\\lib\\site-packages\\ipykernel_launcher.py:8: RuntimeWarning: invalid value encountered in true_divide\n",
+      "  \n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "pi [0.71477891 0.28522109]\n",
+      "a [[2.72155818e-179 4.85324561e-181]\n",
+      " [3.87594275e-180 2.70099412e-179]]\n",
+      "b [[nan nan]\n",
+      " [nan nan]\n",
+      " [nan nan]\n",
+      " [nan nan]\n",
+      " [nan nan]\n",
+      " [nan nan]]\n",
+      "b sum [nan nan]\n"
+     ]
+    }
+   ],
+   "source": [
+    "def _scaled_forward(obs, pi, a, b):\n",
+    "    \"\"\"Forward pass with per-step normalisation; returns (alpha_hat, scale).\"\"\"\n",
+    "    alpha = np.empty((obs.size, pi.size))\n",
+    "    scale = np.empty(obs.size)\n",
+    "    alpha[0] = pi * b[obs[0]]\n",
+    "    scale[0] = alpha[0].sum()\n",
+    "    alpha[0] /= scale[0]\n",
+    "    for t in range(1, obs.size):\n",
+    "        alpha[t] = b[obs[t]] * (alpha[t-1] @ a)\n",
+    "        scale[t] = alpha[t].sum()\n",
+    "        alpha[t] /= scale[t]\n",
+    "    return alpha, scale\n",
+    "\n",
+    "def _scaled_backward(obs, a, b, scale):\n",
+    "    \"\"\"Backward pass rescaled with the forward scale factors; returns beta_hat.\"\"\"\n",
+    "    beta = np.empty((obs.size, a.shape[0]))\n",
+    "    beta[-1] = 1.0\n",
+    "    for t in range(obs.size-2, -1, -1):\n",
+    "        beta[t] = a @ (b[obs[t+1]] * beta[t+1]) / scale[t+1]\n",
+    "    return beta\n",
+    "\n",
+    "def baum_welch(sequence, n_iter=20):\n",
+    "    \"\"\"Estimate the HMM parameters of a two-state die model with Baum-Welch (EM).\n",
+    "\n",
+    "    The parameters start from the dishonest-casino guess (uniform start\n",
+    "    distribution, 0.05 switching probability, emission() for the emission table)\n",
+    "    and are re-estimated n_iter times. Scaled forward/backward passes are used\n",
+    "    so that long sequences do not underflow.\n",
+    "\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    sequence : array-like\n",
+    "        1-D sequence of observed die values in 1..6.\n",
+    "    n_iter : int, optional\n",
+    "        Number of EM iterations (default 20).\n",
+    "\n",
+    "    Returns\n",
+    "    -------\n",
+    "    tuple\n",
+    "        (pi, a, emissions): start distribution of shape (2,), transition matrix\n",
+    "        of shape (2, 2) whose rows sum to 1, and emission table of shape (6, 2)\n",
+    "        where emissions[k-1, i] is the probability of value k in state i.\n",
+    "        The same values are also printed.\n",
+    "\n",
+    "    Raises\n",
+    "    ------\n",
+    "    ValueError\n",
+    "        If the sequence is empty or contains a value outside 1..6.\n",
+    "    \"\"\"\n",
+    "    obs = np.asarray(sequence).astype(int) - 1 # 0-based symbol indices\n",
+    "    if obs.size == 0:\n",
+    "        raise ValueError(\"sequence must contain at least one observation\")\n",
+    "    if obs.min() < 0 or obs.max() > 5:\n",
+    "        raise ValueError(\"observations must be die values between 1 and 6\")\n",
+    "\n",
+    "    # Initial guess; set once, outside the loop, so every iteration refines it.\n",
+    "    pi = np.asarray((.5,.5)) # start probability\n",
+    "    a = np.asarray([[.95,.05],[.05,.95]]) # transition probability\n",
+    "    emissions = np.asarray([emission(k) for k in range(1,7)])\n",
+    "\n",
+    "    for _ in range(n_iter):\n",
+    "        # Expectation step\n",
+    "        alpha, scale = _scaled_forward(obs, pi, a, emissions)\n",
+    "        beta = _scaled_backward(obs, a, emissions, scale)\n",
+    "        gamma = alpha * beta # each row already sums to 1 thanks to the scaling\n",
+    "        # xi_sum[i, j] = sum_t alpha_t(i) * a[i, j] * b_j(x_{t+1}) * beta_{t+1}(j)\n",
+    "        weighted_next = emissions[obs[1:]] * beta[1:] / scale[1:, np.newaxis]\n",
+    "        xi_sum = a * (alpha[:-1].T @ weighted_next)\n",
+    "\n",
+    "        # Maximization step\n",
+    "        pi = gamma[0]\n",
+    "        row_tot = xi_sum.sum(axis=1, keepdims=True)\n",
+    "        # Keep the previous row when a state has no expected transitions (e.g. one observation).\n",
+    "        a = np.divide(xi_sum, row_tot, out=a.copy(), where=row_tot > 0)\n",
+    "        counts = np.zeros_like(emissions)\n",
+    "        np.add.at(counts, obs, gamma) # counts[k, i] = sum of gamma_t(i) over t with x_t == k+1\n",
+    "        state_tot = gamma.sum(axis=0)\n",
+    "        emissions = np.divide(counts, state_tot, out=emissions.copy(), where=state_tot > 0)\n",
+    "\n",
+    "    print(\"pi\", pi)\n",
+    "    print(\"a\", a)\n",
+    "    print(\"b\",emissions)\n",
+    "    print(\"b sum\",np.sum(emissions, axis=0))\n",
+    "    return pi, a, emissions\n",
+    "\n",
+    "\n",
+    "pi_hat, a_hat, b_hat = baum_welch(get_pb2())\n"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
    }
   }
  ],