{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "colab_type": "code",
    "id": "6iaJVt_LXXDG",
    "outputId": "a5522632-df43-4c72-f098-6bcc67bc7989"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(100,)\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXQAAAD4CAYAAAD8Zh1EAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAAgAElEQVR4nO3deXhU5fn/8fc9kxWyQFYCBAKyJkBYImgR91JQCkhdQGzFXVut1rZf9WfV4m7VYqla97V1w2qliEVUtBTZghK2QBIgkCCEkEBICNmf3x8zgck+IZOcyeR+XVeumTnr5zxncufkmTPniDEGpZRSnZ/N6gBKKaU8Qwu6Ukr5CC3oSinlI7SgK6WUj9CCrpRSPsLPqhVHRUWZhIQEq1avlFKd0oYNGw4ZY6IbG2dZQU9ISCA1NdWq1SulVKckInuaGqddLkop5SO0oCullI/Qgq6UUj7Csj50pZTvq6ysJDc3l7KyMqujdDpBQUH07dsXf39/t+fRgq6Uaje5ubmEhoaSkJCAiFgdp9MwxlBQUEBubi4DBgxwe74Wu1xE5DUROSgiW5oYLyKyUESyRGSTiIxtRW6llA8rKysjMjJSi3kriQiRkZGt/s/GnSP0N4BngbeaGD8VGOz8mQD8zfnYvnLWQfZKSJjkeF37PH58w/Guw9LegZJ8CImB5DmQtw2+fwtC42Di7SenbWp9B7fDvlQYPh1+PP/kMhHH8urPXztfcCQcLziZp7F8Ta3XdfnQcH056yDtXSjJg+NHoCgX/INgwi8hZV697Y6G5Cubzlk/T+obkP4JDJ/hWFZzbVN/G+vn75UMBzY23VbNbXuv5JPLhrpZazP2GgVBYU23aXPb6M57oEG2dwEDvUY33O6W1tlRWrv+dsirxfzUnEq7iTuXzxWRBGCJMWZEI+NeBL42xrzrfL0DONcYs7+5ZaakpJhTPg89Zx28OR2qK8DmBxioqQZ7AFy92DFN7XjXYW9c7BhWy+YHNVUur/3hmqWN/1K+OR2qyhzrqjXyctj2r5PLtAfCvCV1i9mb06G6HEwNYAO/QJjyOPzn7rr5mipArplt/s5trTq5vql/gs/+z7GOxky8A9Y8X3e77QEw79NGctbLk/oGLLn95HzT/tKwqJ9om3KgBsTmyNVUm5/IUK+tWtp2RwOA3Q8QRxvYA2DCTbDqGZdpBPyCGrapu9vY1HugQbZpddvcdbtbateO0tr1t0Pe9PR0hg8f3qZldGWNtZ+IbDDGpDQ2vSfOcukD5Li8znUOa0BEbhSRVBFJzc/PP6WV5ReXc3DzF5jqCjDVmOoKTHUlmGrHGzF7pePHOb7usMq6C3Mt5gA1lY7p6qtdHvX++GUtr7vM2nXVn8/U1K7A8Tr9k4b5GlM/c01l3cyuy2pK+uKG211d2UTOennSP6m3rHqvXefFuY2mpvk2d83e1HafWG79eWscw1yzpi+uN41pfNnubmNT74HGllVntTXN7P8W9nN7ae36rc6r2qxDT1s0xrxkjEkxxqRERzf6zdUWffRdLjevDKasxk6VsVFh7FQYO1XYKDN2fr06hLu/C6ccP6qxUYEfbx/ox0eFA6gSfwyc/BG/uiXa5n/yX3pXCZMcRyzU+xdo0I/B7vIJtD2g7vy180ltM9scr4fPcA63N5ynwXpdlm/zd/5H4rK+2mU1Zfj0ussAx+tGc9bLM3xGvWXVe+06b+1bSWwnl1E/f50MzWz3ieXWn9fmGOaadfj0etNI48t2dxubeg80tqw6q7U1s/9b2M/tpbXrtzqvBS699FJ27drVpmUsWrSIpKQkbDZbg2+/t3R5k4qKCs4++2yqqqqanc5dna7LZfehY2zff5SAA6n0yFvH7pAxlFVW0+twKumBo9hmH0ZJeRVxRzcx+Hgaq6qG8b+ygVTVGMZKBrPsK4miiEOE81H1JIZIDlf6f80Rvyg+Db2cgp6jiQ0LJDYsiNiwQGLCgogNDaJPySZCD6zFlq996I1m1D507UNvhDd3uWzdupU//OEPfPzxx21aTnp6OjabjZtuuomnnnqKlJSTvSEJCQlkZ2c3O//8+fMZNGgQc+fObXTZrely8URBvxi4FbgIx4ehC40xLb4T2tSH3krGGMoqazhaVsmR0koOl1Zw+FgFBcdcHksrKDxWQX5xOfnF5RQca9iN4W8XevcIJr5nN+IjgunbsxvxEd2I7xlMv4huRHQP0A+AlHLhWpDm/3sr23446tHlJ/YO44GfJjU7TXZ2NlOmTGHcuHF89913JCUl8dZbb/Hwww8zZMgQ5s2bx2uvvcamTZt45hnH5zEvv/wy27ZtY8GCBW5nOffcc5ss6Hv27OHCCy9k9erVREREcM4553DfffcxefJk0tLSuOeee1i6dGmDZba2oLd4louIvAucC0SJSC7wAOAPYIx5AViKo5hnAaXANW5tfQcSEYID7AQH2IkNC3JrnoqqGvJLyjlQVMbBo2XkHS3jwNFy9h05zt7CUj7fmteg6IcE+nFaTAiDa39iQxgcE0qfHsHYbFrolbLKjh07ePXVV5k4cSLXXnstzz//PKtWrWLOHMd/vZdffjmPPPIITz75JP7+/rz++uu8+OKLAEyaNIni4uIGy3zqqae48MIL3Vp///79ueuuu7jlllsYP348iYmJTJ48GYARI0awfv16j2xniwXdGDOnhfEG+JVH0niRAD8bfXoE06dHcJPTHCuvIvfwcXIKS9lbWMqegmNk5Zfw34x8PtyQe2K6YH87g2JCGNYrlFHxPRjdtwdDe4US4KdXXlBdR0tH0u0pPj6eiRMnAnDVVVexcOFC9u/fT+1neSEhIZx//vksWbKE4cOHU1lZyciRIwFYudIzHw5ff/31LFq0iBdeeIGNGzeeGG632wkICKC4uJjQ0NA2rUO/KdoG3QP9GNorlKG9Gu6EotJKsvKLycwrIfNgCRl5xXy5/SCLnIU+wM/G8LgwkvuGk9y3B8nxPTgturt22SjVDur/XokIwcHBdb64c/311/Poo48ybNgwrrnmZEeDJ47QAUpLS8nNdfz+l5SU1Cne5eXlBAW513vQHC3o7SS8mz/j+kcwrn/EiWHGGHIPH2dTbhFpuUdIyznCPzfk8tZqx+WNo0IC+dFpkUwcFMnEQVH07dnNqvhK+ZS9e/eyevVqzjzzTN555x3OOussAgMDycrKOnEmyoQJE8jJyeG7775j06ZNJ+b11BH6XXfdxdy5c+nfvz833HADS5YsAaCgoICoqKhWXbOlKVrQO5CIOD5EjejGxaPiAKiuMezML+H7vYf5dmcBq7IKWJz2AwD9I7vxo9OiHAX+tCh6dm/m9ESlVJOGDh3Kc889x7XXXktiYiK33HILMTExfP3113WOsi+//HI2btxIz5493V72xx9/zG233UZ+fj4XX3wxo0ePZtmyZXWm+eabb1i/fj2rVq3Cbrfzz3/+k9dff51rrrmGFStWcPHFF3tkO906y6U9dORZLp2JMYbMgyX8L/MQ3+48xJpdhZSUV2G3CWcMjGDqiDh+ktSL6NBAq6Mq1SJvOG0xOzubadOmsWVL3ctRHT9+nPPOO+9EkQWYNm0av/nNb7jgggs8sm53TlucNWsWjz/+OEOGDGkwzuNnuaiOJSIMiQ1lSGwo1541gKrqGtJyi/hqex5LNx/gD//awv2fbGH8gAguGhnHlKRexLh55o5S6qTg4GDmz5/Pvn37CAsLY/z48SQnJ3usmLujoqKCmTNnNlrMT4UeoXcixhh25BWzdPMBPtu8n8yDJYjA6f0juGRsH2aM7k23AP0brbyHNxyhW+mZZ57hjjvuOOX52+WLRe1BC3rbZeYV89mWAyzZ9AMZeSWEBvoxa2wf5p7RnyGxbTv9SSlP6OoFva20y6ULGRwbyuDYUG47fxAb9hzmH2v38u66HN5cvYfxCRHMPaMfU0b0ItDPbnVUpVQH0ILuA0SElIQIUhIiuG9aIotSc/jH2r3c/t5GIrsHcMXp8Vx71gCiQvSDVKV8mRZ0HxPRPYCbzjmNGyYNZGXWIf6+Zg8vfLOT11dlc/WPErjx7IFE6OmPSvkk/e65j7LZhHOGRPPyL1JYfuc5TE6K5cX/7mTSE1/x5LLtHClt5hrqSvkQu93O6NGjSUpKIjk5maeffpqamppm58nOzuadd97poISeowW9CzgtOoS/zB7D53eczXnDYnhuxU7OemIFf16eQdHxJm5AoZRVctbByqcdjx4QHBzMxo0b2bp1K8uXL+ezzz5j/vz5zc6jBV15vcGxoTx75Vj+c8ckJg2OYuGXmZz1xFc8tyKLiqrmj1iU6hC1t8H76hHHo4eKeq2YmBheeuklnn32WYwxZGdnM2nSJMaOHcvYsWP59ttvAbj77rtZuXIlo0ePZsGCBU1O5220D70LGtYrjL9dNY5tPxzlz8szeHLZDj7+fh+PzBzBhIGRVsdTXVljt8Hz8I1BBg4cSHV1NQcPHiQmJobly5cTFBREZmYmc+bMITU1lccff5ynnnrqxPVWSktLG53O22hB78ISe4fxytUpfLU9j/s/2coVL63hsnF9ueei4frBqbJG7W3wam9U3c63wausrOTWW29l48aN2O12MjIy2jSd1bSgK84fFsuZA6NY+FUmL/93F1+k53HPRcO5bFxfvZyv6ljx4+Hqxe16275du3Zht9uJiYlh/vz5xMbGkpaWRk1NTZOXsF2wYIFb01lN+9AVAMEBdu6aMoxPfz2J06JD+L8PN3HFi2vIzGt4HWil2lX8eJj023Yp5vn5+dx8883ceuutiAhFRUXExcVhs9l4++23qa6uBiA0NLTONdCbms7baEFXdQztFcoHN53JEz8bScbBYqb+ZSUvfLOTmhprLhGhVFsdP378xGmLF154IZMnT+aBBx4A4Je//CVvvvkmycnJbN++ne7duwMwatQo7HY7ycnJLFiwoMnpvI1ey0U1qaCknPs+2cLSzQc4b2g0T18+WvvWVavotVzaprXXctEjdNWkyJBAnrtyLA/NSGJVVgEXL1xJanah1bGUUk3Qgq6aJSL8/MwEPvrlj/C327jipTXaBaOUl9KCrtwyok84S359FlOSevH4Z9u59s31FB7TyweollnVrdvZnUq7aUFXbgsL8ufZK8fw0Iwkvs0q4KK/rGS9dsGoZgQFBVFQUKBFvZWMMRQUFLT69Ej9UFSdki37ivjVO9+x7/BxnrosmZlj+lgdSXmhyspKcnNzKSsrszpKpxMUFETfvn3x9/evM1xvcKE8bkSfcBbfehY3vpXKHe9vJO9oGTeePVC/iKTq8Pf3Z8CAAVbH6DK0y0WdsvBgf968djwXj4zjsc+28+CSbfphqVIW0iN01SZB/nb+OmcMMWGBvL4qm4PF5Tx9WTJB/nrbO6U6mhZ01WY2m3D/tETiwoN4dOl2DhWX89IvUggP9m95ZqWUx2iXi/IIEeHGs0/jmStG893ew1z+wmoOFOkHYUp1JC3oyqNmjunD6/PGs+/IcWY9v4qsg3pxL6U6ihZ05XFnDY7i/ZvOoKLaMOfltew+dMzqSEp1CW4VdBGZIiI7RCRLRO5uZHw/EVkhIt+LyCYRucjzUVVnktQ7nHdvmEB1jWHuy2vIPVxqdSSlfF6LBV1E7MBzwFQgEZgjIon1JvsD8IExZgwwG3je00FV5zM4NpS3rxtPSXkVc19ZS95R7VNXqj25c4Q+HsgyxuwyxlQA7wEz6k1jgDDn83DgB89FVJ1ZUu9w3rh2PIeKy7nqlbUUlJRbHUkpn+VOQe8D5Li8znUOc/VH4CoRyQWWArc1tiARuVFEUkUkNT8//xTiqs5obL+evDrvdPYWlvKL19ZRdLzS6khK+SRPfSg6B3jDGNMXuAh4W0QaLNsY85IxJsUYkxIdHe2hVavO4IyBkbz483Fk5BUz7/V1lJRXWR1JKZ/jTkHfB8S7vO7rHObqOuADAGPMaiAIiPJEQOU7zh0aw1/njGVTbhHXv7meskrvvC+jUp2VOwV9PTBYRAaISACODz0X15tmL3ABgIgMx1HQtU9FNTBlRC/+fHkya3cXcvPfN1BRVWN1JKV8RosF3RhTBdwKLAPScZzNslVEHhSR6c7JfgvcICJpwLvAPKMXQFZNmDG6D49dMpKvd+TzwOIteq1spTzErWu5GGOW4viw03XY/S7PtwETPRtN+bLZ4/uxt7CU57/eyeCYUK49Sy+xqlRb6TdFlWV+N3kokxNjefjTbXy946DVcZTq9LSgK8vYbMKCK0YztFcYt73zvV73Rak20oKuLNU90I9Xrk4h0N/OdW+mclhvPK3UKdOCrizXp0cwL/58HPuPlHHLPzZQWa1nvih1KrSgK68wrn9Pnrh0JGt2FXL/J1v1zBelToHesUh5jUvG9CUjr4S/fb2TIbEhXDNRz3xRqjX0CF15ld9PHsqPE2N5aMk2vsnQ76Yp1Rpa0JVXsdmEZ64YzZDYUH797vfsO3Lc6khKdRpa0JXX6R7oxwtXjaO6xvDrd7/XD0mVcpMWdOWVEqK68+iskWzYc5gFyzOsjqNUp6AFXXmt6cm9mTM+nue/3qn96Uq5QQu68mr3T0tiaGwod76/kYN6CzulmqUFXXm14AA7z145htKKam5/byPVNXp+ulJN0YKuvN7g2FAenJHE6l0FPPtVltVxlPJaWtBVp3DpuL7MGtOHv3yZweqdBVbHUcoraUFXnYKI8NDMESREduf2976noKTc6khKeR0t6KrT6B7ox7NXjuXI8Uru/CCNGu1PV6oOLeiqU0nsHcb90xL5JiOf11bttjqOUl5FC7rqdOZO6MeFw2P507IdelMMpVxoQVedjojw6KwRdA+w89sP0qjSSwMoBWhBV51UTGgQD80cQVpuES/+d5fVcZTyClrQVac1bVRvpo2K45kvMtj2w1Gr4yhlOS3oqlN7aMYIwoMDuPODjVRUadeL6tq0oKtOrWf3AB6fNZLtB4pZ+GWm1XGUspQWdNXpXZgYy6Xj+vK3b3ayMeeI1XGUsowWdOUT7v9pIrGhgfz2g42UVVZbHUcpS2hBVz4hLMifP12azM78Yzy1bIfVcZSyhBZ05TPOGhzFVWf049VVu1m3u9DqOEp1OC3oyqfcM3U48T278btFaZRWVFkdR6kOpQVd+ZTugX48eeko9haW6r1IVZfjVkEXkSkiskNEskTk7iamuVxEtonIVhF5x7MxlXLfhIGRzBnfj1f/t5vNuUVWx1Gqw7RY0EXEDjwHTAUSgTkiklhvmsHAPcBEY0wScEc7ZFXKbXdPHUZUSCB3/XMTlXqtF9VFuHOEPh7IMsbsMsZUAO8BM+pNcwPwnDHmMIAx5qBnYyrVOuHB/jw4I4lt+4/y6v/0Mruqa3CnoPcBclxe5zqHuRoCDBGRVSKyRkSmNLYgEblRRFJFJDU/P//UEivlpikj4picGMuC5RlkHzpmdRyl2p2nPhT1AwYD5wJzgJdFpEf9iYwxLxljUowxKdHR0R5atVJNe3DGCALsNu7912aM0TscKd/mTkHfB8S7vO7rHOYqF1hsjKk0xuwGMnAUeKUs1Ss8iLumDmNVVgEfbsi1Oo5S7cqdgr4eGCwiA0QkAJgNLK43zb9wHJ0jIlE4umD0ItXKK1w5vh+nJ/Tk4U/TyS/Wm0sr39ViQTfGVAG3AsuAdOADY8xWEXlQRKY7J1sGFIjINmAF8HtjTEF7hVaqNWw24bFZozheUc2DS7ZZHUepdiNW9SumpKSY1NRUS9atuqaFX2by5+UZvDYvhfOHxVodR6lTIiIbjDEpjY3Tb4qqLuPmc05jSGwIf/h4CyXlelkA5Xu0oKsuI8DPxmOzRrH/aJlekVH5JC3oqksZ178nPz+jP2+tztbLAiifowVddTm/+8lQIkMC+X8fb6a6Rs9NV75DC7rqcsKC/Ll/WiKb9xXx9upsq+Mo5TFa0FWXNG1UHJMGR/HU5xnkHS2zOo5SHqEFXXVJIsLDM0dQUV3Dg//Wc9OVb9CCrrqs/pHdue28QXy6eT8rdugFQlXnpwVddWk3njOQgdHduf+TLRyvqLY6jlJtogVddWmBfnYemTmSnMLjPLsi0+o4SrWJFnTV5Z15WiSzxvbhpf/uIjOv2Oo4Sp0yLehKAfdeNJxuAX7c+/EWavTcdNVJaUFXCogMCeSeqcNYl13Ih9/pddNV56QFXSmny1PiSenfk8eWplN4rMLqOEq1mhZ0pZxsNuGRS0ZSXFbFY0vTrY6jVKtpQVfKxdBeoVw3aQCLNuSydpfeo0V1LlrQlarn9gsG06dHMPf+awsVVTVWx1HKbVrQlaqnW4AfD81MIutgCS+v1Fvjqs5DC7pSjTh/WCxTknqx8MtM9haUWh1HKbdoQVeqCQ9MT8TPJtz3yRasuveuUq2hBV2pJsSFB3Pn5KF8k5HP0s0HrI6jVIu0oCvVjKvP7E9S7zDm/3srxWWVVsdRqlla0JVqhp/dxiOXjCS/pJynP8+wOo5SzdKCrlQLRsf3OHFj6U25R6yOo1STtKAr5YbaG0vf+/EWvbG08lpa0JVyg95YWnUGWtCVctO0UXGcPSSapz7PYH/RcavjKNWAFnSl3CQiPDJzBNU1hvv+peemK++jBV2pVoiP6MadPx7CF+kH9dx05XW0oCvVStdMTGBkn3AeWLyVolI9N115Dy3oSrWSn93G4z8byeHSCh7V66YrL+JWQReRKSKyQ0SyROTuZqb7mYgYEUnxXESlvE9S73CunzSA91Nz+HbnIavjKAW4UdBFxA48B0wFEoE5IpLYyHShwO3AWk+HVMob3XHBEPpHduP/fbSZsspqq+Mo5dYR+nggyxizyxhTAbwHzGhkuoeAJ4AyD+ZTymsFB9h59JKRZBeUsvDLTKvjKOVWQe8D5Li8znUOO0FExgLxxphPm1uQiNwoIqkikpqfn9/qsEp5m4mDorhsXF9e/O8utv1w1Oo4qotr84eiImID/gz8tqVpjTEvGWNSjDEp0dHRbV21Ul7h3ouH07ObP3d/tEkvC6As5U5B3wfEu7zu6xxWKxQYAXwtItnAGcBi/WBUdRU9ugXwwE+T2JRbxOurdlsdR3Vh7hT09cBgERkgIgHAbGBx7UhjTJExJsoYk2CMSQDWANONMantklgpLzRtVBznD4vh6c8zyCnUW9Ypa7RY0I0xVcCtwDIgHfjAGLNVRB4UkentHVCpzkBEeGjmCGwCd/1zEzXa9aIs4FYfujFmqTFmiDHmNGPMI85h9xtjFjcy7bl6dK66oj49grlvWiLf7izg7TV7rI6juiD9pqhSHnTF6fGcOzSaxz5LZ/ehY1bHUV2MFnSlPEhEeHzWKALsNn63KE3PelEdSgu6Uh7WKzyIB2eMYMOew7yycpfVcVQXogVdqXYwY3RvpiT14unPM8jIK7Y6juoitKAr1Q5EhIcvGUFIkB+//SCNyuoaqyOpLkALulLtJCokkEcvGcHmfUU8v2Kn1XFUF6AFXal2NGVEHDNH9+avX2WyZV+R1XGUj9OCrlQ7mz99BJEhAdz5wUbKq/Qyu6r9aEFXqp2Fd/Pn8Z+NIiOvhGe+0MvsqvajBV2pDnDe0Bhmnx7Pi9/sZPXOAqvjKB+lBV2pDnLftEQSIrtz+3vfU1BSbnUc5YO0oCvVQboH+vHslWM5crySOz9I0wt4KY/Tgq5UB0rsHcb90xL5JiOfl/RbpMrDtKAr1cHmTujHxSPjeHLZDjbsKbQ6jvIhWtCV6mAiwmM/G0nvHkH8+t2NHCmtsDqS8hFa0JWyQFiQP8/OGcvB4jJ+/+EmjNH+dNV2WtCVskhyfA/umjKM5dvyeOPbbKvjKB+gBV0pC1131gAuGBbDo0vT2ZR7xOo4qpPTgq6UhUSEpy5LJiokkFvf+Z6jZZVWR1KdmBZ0pSzWs3sAC+eMYd+R4/zfIr3BtDp1WtCV8gKnJ0Rwz9Rh/GfrAZ75IsPqOKqT8rM6gFLK4bqzBrDjQDELv8piUGwo05N7Wx1JdTJ6hK6Ul6i9y9HpCT35/aI0Nuboh6SqdbSgK+VFAv3svHDVOKJDA7nhrVT2Fx23OpLqRLSgK+VlIkMCefXq0yktr+KGt1IpraiyOpLqJLSgK+WFhvYKZeGcMWz94Si/W6RXZlTu0YKulJe6YHgs90wdxtLNB3jmS73TkWqZnuWilBe7YdJAMvNKWPhlJoNjQvipnvmimqFH6Ep5MdczX363KI3UbL3crmqaFnSlvFztmS99egRzzevr2ZxbZHUk5aXcKugiMkVEdohIlojc3cj4O0Vkm4hsEpEvRaS/56Mq1XVFhgTy9+snEBbsz89fW8uOA8VWR1JeqMWCLiJ24DlgKpAIzBGRxHqTfQ+kGGNGAR8Cf/J0UKW6ut49gnnnhgkE+tmY+8paduWXWB1JeRl3jtDHA1nGmF3GmArgPWCG6wTGmBXGmFLnyzVAX8/GVEoB9I/szj+un4AxhrmvrCWnsLTlmVSX4U5B7wPkuLzOdQ5rynXAZ42NEJEbRSRVRFLz8/PdT6mUOmFQTChvXzeBY+VVzH1lLXlHy6yOpLyERz8UFZGrgBTgycbGG2NeMsakGGNSoqOjPblqpbqUxN5hvHnteApKypn7yloKSsqtjqS8gDsFfR8Q7/K6r3NYHSJyIXAvMN0Yo+8updrZmH49eXXe6eQeLuXnr66jqFRvjtHVuVPQ1wODRWSAiAQAs4HFrhOIyBjgRRzF/KDnYyqlGnPGwEhe/HkKWQdL+MVrayk8VmF1JGWhFgu6MaYKuBVYBqQDHxhjtorIgyIy3TnZk0AIsEhENorI4iYWp5TysHOGRPO3q8ay/UAxP/vbt/pBaRcmxlhz0Z+UlBSTmppqybqV8kWp2YVc92Yq/nYbb1xzOiP6hFsdSbUDEdlgjElpbJx+U1QpH5GSEME/bzmTQD8bV7y4mpWZeiZZV6MFXSkfMigmlI9++SPiI7pxzevr+fj7XKsjqQ6kBV0pHxMbFsQHN5/J6QkR/Ob9NF74ZidWda2qjqUFXSkfFBbkzxvXns5Pk3vz+Gfbmf/vbVTrTTJ8nl4PXSkfFehn5y9XjCY2NJBX/reb3YeOseCK0UR0D7A6mmoneoSulK5iFBcAAA6XSURBVA+z2YQ/TEvk4ZkjWL2zgIv+spL1ek11n6UFXaku4Koz+vPRL39EkL+N2S+t4fmvs/Q+pT5IC7pSXcSIPuH8+7azmDqiF3/6zw6ueWO9frPUx2hBV6oLCQ3y569zxji6YHZpF4yv0YKuVBcjIo4umFtOdsE8tyKLquoaq6OpNtKCrlQXVdsFc9HIOJ5ctoOZz68iLeeI1bFUG2hBV6oLCw3yZ+Hs0Tw/dyz5xeXMfH4V93+yhaNleinezkgLulJdnIhw0cg4vrjzHK4+M4G/r9nDhU9/w5JNP+g3TDsZLehKKcBxtP7H6Un861cTiQ0L4tZ3vmfe6+vZW6CX4+0stKArpeoY1bcH//rVRB74aSIb9hzmxwu+4c+f76DouHbDeDst6EqpBuw24ZqJA/jiznO4MDGWhV9lMemJr1j4ZSbF2r/utfQGF0qpFm3ZV8QzX2TyRXoePbr5c8OkgVz9owRCAvVyUB2tuRtcaEFXSrltU+4Rnvkik6+2H6RnN39uOuc0fnFmf7oFaGHvKFrQlVIe9f3ewzzzRSbfZOQT2T2AKyf0Y874fvTuEWx1NJ+nBV0p1S427CnkuRU7WbHjIAKcPyyWq87ox9mDo7HZxOp4Pqm5gq7/JymlTtm4/hG8Ni+CnMJS3lm3lw/W5/BFeh79Irpx5YR+XJ4Sr9df70B6hK6U8pjyqmqWbc3j72v2sG53IQF2Gz8Z0YuLR8Zx7tBogvztVkfs9LTLRSnV4TLyivnHmj0sTvuBw6WVdAuwc/6wGC5yFnf9IPXUaEFXSlmmqrqGtbsL+XTzfpZtOUDBsQqC/G2cNzSGqSPjOGdINOHB/lbH7DS0oCulvEJ1jWHd7kI+27Kfz7YcIL+4HJvAyD7hTBwUxcRBUYzr31O7ZpqhBV0p5XWqawzf7T3MysxDrMo6xMacI1TXGAL8bKT078nEQVGceVokSb3DCPTTAl9LC7pSyuuVlFexbncBq7IKWJV1iO0HigHwtwvD48IY1Tec5L49SI7vwWnRIdi76GmRWtCVUp3OoZJy1u0uJC33CJtyiti8r4iS8ioAugfYSeoTTlLvMIbEhjI4JoTBMaGEd/P9vng9D10p1elEhQRy0cg4LhoZB0BNjWHXoRLScorYlHuEjblFvLcuh+OV1SfmiQkNZHCso7gPigmhf2Q34nt2o3ePYAL8fP9ahFrQlVKdgs0mDIoJZVBMKD8b1xdwFPl9R46TebCYzLwSMg86fhal5nCs4mShtwnEhQfTt2cw8RGOIt+3ZzC9woOIDQskJiyI0EA/RDp3N44WdKVUp2WziaNAR3Tj/GGxJ4YbY9hfVMbewlJyCkvJOXyc3MJS9haWsjIzn7yj5Q2WFexvP1HcY8OCiAoJIKJbAD27BxDZve5jj2B//Ozed8TvVkEXkSnAXwA78Iox5vF64wOBt4BxQAFwhTEm27NRlVLKPSJC7x7B9O4RzBkDIxuML6usZn9RGQePlpFXXO54PFrGgaPl5B0tY3PuEQpKKih29tk3JjTQj7Bgf0KDHI9hQf6EBfsRFuQY1j3Q+RNgdz760T3Q8bxXeBBhQZ7v72+xoIuIHXgO+DGQC6wXkcXGmG0uk10HHDbGDBKR2cATwBUeT9uZ5ayD7JWQMAnix3fedfiCnHWQ9i5gIPlKz7ZV7T4IjoTjBScfEyY5xnti/zS2n12Hua6n9nn9HO5sv+sy87ZB+icwfAakzHO24TtQkg8hMZA8p+Fy3H0/pr4B378FoXEw8faW28a1jQ+k1d2O2lyII5NrW8SPd6wr/ROCeo1iQFAYAxImQfL4ustOex/CHdtVOeIKCiNGU3isosFP+KHv6XU4lUM13fEvOcz6kiTWVQ3i6PFKBlVs4wxJ5/Oa4XxnhjBWMphlXwnAR9WTuGTGLH5+Rv/mt/MUtHiWi4icCfzRGPMT5+t7AIwxj7lMs8w5zWoR8QMOANGmmYV3qbNcctbBm9OhugLsAXD1Ys8X3I5Yhy/IWQdvTINq57/c9gCY96ln2qp2H1SVAzWAAAbEBjZ/x/Oa6rbtn8b2M5wcZvM7uZ4Tz6vA1AA2sPuBMVBT2fz2u65HxLGMWhPvgDXPO8bVsgfCvCV1/8C4835MfQOW3H7ytc0frlna/B+ZOm1cu/4AmPokfPb7k7ls/o62r6lyjJ9wE6x6xmVhAn5BJ7PlrIM3Lm5+uxq0T/nJtvULPLE/zIlt96fgrAeJ+O8fkBrHcmtsARy85EPiRp7T+Da2oLmzXNzpBOoD5Li8znUOa3QaY0wVUAQ0+D9HRG4UkVQRSc3Pz3cnu2/IXunYuaba8Zi9snOuwxfUtlOt6krPtdWJZdcWGufxjKlxDK+ubPv+aWw/1x/mup7qSmfBwZGruvJkMYemt991mTX1uh3SFzvmc1V/m9x9P6Z/Uvd1TQv7o0Ebu2xH+id1c9VU1s2QvrjewkzdbNkrW96uBtvn2rYn94dUVyCmGqmuJCrnP9hqKhEcf+LtNZXEHWmfg9kO7dU3xrxkjEkxxqRER0d35KqtlTDJcYQgdsdj7b+9nW0dvqC2nWrZ/T3XVieWXftr5TxjQmyO4Xb/tu+fxvZz/WGu67E7j1LBkcvu7/xvwamp7Xddpq1ez+zw6Y75XNXfJnffj8Nn1H1ta2F/NGhjl+0YPqNuLpt/3QzDp9dbmK1utoRJLW9Xg+1zbdsm9kf9XO34+6ldLh1F+9C9h/ahd/k+dHqNgqCwhtnc2a7GctS2bWP7o7Fcbdj/bfqmqLNAZwAXAPuA9cCVxpitLtP8ChhpjLnZ+aHoLGPM5c0tt8sVdKWU8oA2fVPUGFMlIrcCy3CctviaMWariDwIpBpjFgOvAm+LSBZQCMz2XHyllFLucOs8dGPMUmBpvWH3uzwvAy7zbDSllFKt4X1fdVJKKXVKtKArpZSP0IKulFI+Qgu6Ukr5CMtucCEi+cCeU5w9CjjkwTieorlaR3O1nrdm01yt05Zc/Y0xjX4z07KC3hYiktrUeZhW0lyto7laz1uzaa7Waa9c2uWilFI+Qgu6Ukr5iM5a0F+yOkATNFfraK7W89Zsmqt12iVXp+xDV0op1VBnPUJXSilVjxZ0pZTyEV5b0EXkMhHZKiI1ItLk6T0iMkVEdohIlojc7TJ8gIisdQ5/X0QCmlpGK3NFiMhyEcl0PvZsZJrzRGSjy0+ZiMx0jntDRHa7jBvdUbmc01W7rHuxy3Ar22u0iKx27u9NInKFyziPtldT7xeX8YHO7c9ytkeCy7h7nMN3iMhP2pLjFHLdKSLbnO3zpYj0dxnX6D7toFzzRCTfZf3Xu4y72rnfM0Xk6g7OtcAlU4aIHHEZ157t9ZqIHBSRLU2MFxFZ6My9SUTGuoxre3sZY7zyBxgODAW+BlKamMYO7AQGAgFAGpDoHPcBMNv5/AXgFg/l+hNwt/P53cATLUwfgeOSwt2cr98ALm2H9nIrF1DSxHDL2gsYAgx2Pu8N7Ad6eLq9mnu/uEzzS+AF5/PZwPvO54nO6QOBAc7l2Dsw13ku76FbanM1t087KNc84NlG5o0Adjkfezqf9+yoXPWmvw3HZb/btb2cyz4bGAtsaWL8RcBnOG5ndQaw1pPt5bVH6MaYdGPMjhYmGw9kGWN2GWMqgPeAGSIiwPnAh87p3gRmeijaDOfy3F3upcBnxphSD62/Ka3NdYLV7WWMyTDGZDqf/wAcBNrjHoWNvl+ayfshcIGzfWYA7xljyo0xu4Es5/I6JJcxZoXLe2gN0NdD625Trmb8BFhujCk0xhwGlgNTLMo1B3jXQ+tuljHmvzgO4JoyA3jLOKwBeohIHB5qL68t6G5q6gbWkcAR47hhtetwT4g1xux3Pj8AxLYw/Wwavpkecf67tUBEAjs4V5A4btS9prYbCC9qLxEZj+Ooa6fLYE+1V1tueO7OvO2Zy9V1OI7yajW2Tzsy18+c++dDEYlv5bztmQtn19QA4CuXwe3VXu5oKrtH2sutG1y0FxH5AujVyKh7jTGfNDK8QzSXy/WFMcaISJPnfTr/8o7EcbenWvfgKGwBOM5FvQt4sANz9TfG7BORgcBXIrIZR9E6ZR5ur7eBq405cTv1U24vXyQiVwEpwDkugxvsU2PMzsaX4HH/Bt41xpSLyE04/rs5v4PW7Y7ZwIfGmGqXYVa2V7uytKAbYy5s4yL2AfEur/s6hxXg+FfGz3mUVTu8zblEJE9E4owx+50F6GAzi7oc+NgYU+my7Nqj1XIReR34XUfmMsbscz7uEpGvgTHAP7G4vUQkDPgUxx/zNS7LPuX2akRT75fGpskVx/10w3G8n9yZtz1zISIX4vgjeY4xprx2eBP71BMFqsVcxpgCl5ev4PjMpHbec+vN+7UHMrmVy8Vs4FeuA9qxvdzRVHaPtFdn73JZDwwWxxkaATh23mLj+JRhBY7+a4CrAU8d8S92Ls+d5Tbou3MWtdp+65lAo5+Gt0cuEelZ22UhIlHARGCb1e3l3Hcf4+hb/LDeOE+2V6Pvl2byXgp85WyfxcBscZwFMwAYDKxrQ5ZW5RKRMcCLwHRjzEGX4Y3u0w7MFefycjqQ7ny+DJjszNcTmEzd/1TbNZcz2zAcHzCudhnWnu3ljsXAL5xnu5wBFDkPWjzTXu31aW9bf4BLcPQjlQN5wDLn8N7AUpfpLgIycPyFvddl+EAcv3BZwCIg0EO5IoEvgUzgCyDCOTwFeMVlugQcf3Vt9eb/CtiMozD9HQjpqFzAj5zrTnM+XucN7QVcBVQCG11+RrdHezX2fsHRhTPd+TzIuf1ZzvYY6DLvvc75dgBTPfx+bynXF87fg9r2WdzSPu2gXI8BW53rXwEMc5n3Wmc7ZgHXdGQu5+s/Ao/Xm6+92+tdHGdpVeKoX9cBNwM3O8cL8Jwz92ZczuDzRHvpV/+VUspHdPYuF6WUUk5a0JVSykdoQVdKKR+hBV0ppXyEFnSllPIRWtCVUspHaEFXSikf8f8BeYdSbDLcQYsAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     pcost       dcost       gap    pres   dres\n",
      " 0: -3.4810e+03 -9.7565e+04  1e+05  7e-02  4e-16\n",
      " 1: -3.4997e+03 -5.3183e+03  2e+03  7e-04  4e-16\n",
      " 2: -3.5029e+03 -3.5825e+03  8e+01  3e-05  3e-16\n",
      " 3: -3.5035e+03 -3.5100e+03  7e+00  2e-06  3e-16\n",
      " 4: -3.5036e+03 -3.5040e+03  4e-01  1e-07  3e-16\n",
      " 5: -3.5036e+03 -3.5037e+03  2e-02  3e-09  3e-16\n",
      " 6: -3.5036e+03 -3.5036e+03  8e-04  3e-11  3e-16\n",
      "Optimal solution found.\n",
      "     pcost       dcost       gap    pres   dres\n",
      " 0: -3.3507e+03 -9.7403e+04  1e+05  7e-02  5e-16\n",
      " 1: -3.3692e+03 -5.1857e+03  2e+03  7e-04  5e-16\n",
      " 2: -3.3720e+03 -3.4417e+03  7e+01  2e-05  4e-16\n",
      " 3: -3.3727e+03 -3.3771e+03  5e+00  1e-06  3e-16\n",
      " 4: -3.3728e+03 -3.3730e+03  2e-01  6e-08  3e-16\n",
      " 5: -3.3728e+03 -3.3728e+03  1e-02  1e-09  3e-16\n",
      " 6: -3.3728e+03 -3.3728e+03  8e-04  1e-11  3e-16\n",
      "Optimal solution found.\n",
      "     pcost       dcost       gap    pres   dres\n",
      " 0: -3.4105e+03 -9.7444e+04  1e+05  7e-02  5e-16\n",
      " 1: -3.4289e+03 -5.2448e+03  2e+03  7e-04  5e-16\n",
      " 2: -3.4320e+03 -3.5040e+03  8e+01  3e-05  4e-16\n",
      " 3: -3.4324e+03 -3.4367e+03  4e+00  1e-06  3e-16\n",
      " 4: -3.4326e+03 -3.4328e+03  2e-01  6e-08  4e-16\n",
      " 5: -3.4326e+03 -3.4326e+03  1e-02  2e-09  3e-16\n",
      " 6: -3.4326e+03 -3.4326e+03  7e-04  2e-11  3e-16\n",
      "Optimal solution found.\n"
     ]
    }
   ],
   "source": [
    "import numpy as np\n",
    "from numpy import genfromtxt\n",
    "from sklearn import svm\n",
    "from sklearn.metrics import accuracy_score\n",
    "import random\n",
    "import matplotlib.pyplot as plt\n",
    "import xgboost as xgb\n",
    "from xgboost import XGBClassifier\n",
    "from sklearn.tree import DecisionTreeClassifier\n",
    "from sklearn import svm\n",
    "from sklearn.linear_model import LogisticRegression\n",
    "import statsmodels.api as sm\n",
    "import numpy.linalg as LA\n",
    "import scipy\n",
    "import sys\n",
    "from cvxopt import matrix, solvers\n",
    "import scipy.io as sio\n",
    "def V_matrix_Huang(T,X,n_t):\n",
    "  l = len(X)\n",
    "  m = len(T)\n",
    "  V = np.identity(l)\n",
    "  P = matrix(gram_matrix(X))\n",
    "  K = Kernel.gaussian(1)\n",
    "  sum_T = [0 for i in range(l)]\n",
    "  for i in range(l):\n",
    "    for t in range(m):\n",
    "      sum_T[i]+=K(T[t],X[i])\n",
    "    sum_T[i] = -1*l/m*sum_T[i]  \n",
    "  q = matrix(sum_T)\n",
    "  G = [[0]*l for i in range(2*l+2)]\n",
    "  for i in range(l):\n",
    "    G[i][i] = 1\n",
    "    G[i+1][i] = -1\n",
    "  for j in range(l):\n",
    "    G[2*l][j] = 1\n",
    "    G[2*l+1][j] = -1\n",
    " \n",
    "  G = matrix(np.array(G),tc ='d')\n",
    "  B = 10\n",
    "  eps = 1-1/np.sqrt(l)\n",
    "  h = [0 for i in range(2*l+2)]\n",
    "  for i in range(l):\n",
    "    h[i] = B\n",
    "  h[2*l] = l+l*eps\n",
    "  h[2*l+1] = l-l*eps   \n",
    "  h = matrix(h)\n",
    "  sol = solvers.qp(P,q,G,h)\n",
    "  solution = np.array(sol['x'])\n",
    "  diagonal = [solution[i][0] for i in range(l)]\n",
    "  V = np.diag(diagonal)\n",
    "  return V \n",
    "\n",
    "def V_matrix_new(T,X,n_t):\n",
    "  l = len(X)\n",
    "  V_3 = np.identity(l) # our V\n",
    "  for i in range(l):\n",
    "    for j in range(l):\n",
    "      V_3[i,j] = 0\n",
    "      for t in T:\n",
    "        if t >= np.maximum(X[i],X[j]):\n",
    "          V_3[i,j]+= 1\n",
    "      V_3[i,j] = V_3[i,j]/n_t \n",
    "  return V_3    \n",
    "def unif_kernel(x,X,h):\n",
    "  n = len(X)\n",
    "  val = 0\n",
    "  for i in range(n):\n",
    "    if np.abs((x-X[i])/h) <=1:\n",
    "      val+= 0.5\n",
    "    \n",
    "  q = val/(n*h)\n",
    "  return q\n",
    "def gauss_kernel(x,X,h):\n",
    "  n = len(X)\n",
    "  val = 0\n",
    "  for i in range(n):\n",
    "    val+=1/(np.sqrt(2*np.pi))*(np.exp(-((x-X[i])/h)**2/2))\n",
    "  q = val/(n*h)\n",
    "  return q\n",
    "def V_matrix_Shimodaira(T,X,n_t,h):\n",
    "  l = len(X)\n",
    "  V_1 = np.identity(l)\n",
    "  a = 0.3\n",
    "  for i in range(l):\n",
    "    l_1 = gauss_kernel(X[i],T,h)\n",
    "    l_0 = gauss_kernel(X[i],X,h)\n",
    "    V_1[i,i] = l_1/l_0\n",
    "  return V_1\n",
    "def V_matrix_Sugiyama(T,X,n_t,h,tau):\n",
    "  l = len(X)\n",
    "  V_1 = np.identity(l)\n",
    "  for i in range(l):\n",
    "    l_1 = gauss_kernel(X[i],T,h)\n",
    "    l_0 = gauss_kernel(X[i],X,h)\n",
    "    V_1[i,i] = (l_1/l_0)**tau\n",
    "  return V_1 \n",
    "def V_matrix_Makoto(T,X,n_t,h,a):\n",
    "  l = len(X)\n",
    "  V_1 = np.identity(l)\n",
    "  for i in range(l):\n",
    "    l_1 = gauss_kernel(X[i],T,h)\n",
    "    l_0 = gauss_kernel(X[i],X,h)\n",
    "    V_1[i,i] = l_1/(a*l_0+(1-a)*l_1)\n",
    "  return V_1  \n",
    "\"\"\"Using direct closed form solution for conditional probability distribution from Vapnik's paper for VSVM problem\n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "P(y=1|x)  = A^T\\mathcal{K}+c\n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "A = A_b - cA_c\n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "A_b  \n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "A_c \n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "c \n",
    "\n",
    "---\n",
    "\n",
    "\n",
    "\\mathcal{K} = [...K(x,x_i)...]^T \n",
    "\n",
    "---\n",
    "U = [---K(x_i,x_j)--] where x_i, x_j are the ith and jth sample form training data and K is the kernel.\n",
    "\n",
    "---\n",
    "\n",
    "Y= (y_1, y_2, ...., y_n) training labels\n",
    "\"\"\"\n",
    "\n",
    "def test_methods(T,X,Y,V_1,V_2,V_3,V_4):\n",
    "  U = gram_matrix(X)# get the gram matrix for the given training set X\n",
    "  g = 0.1  \n",
    "  A_1,c_1 = A_estimate(V_1,U,Y,g)\n",
    "  A_2,c_2 = A_estimate(V_2,U,Y,g)\n",
    "  A_3,c_3 = A_estimate(V_3,U,Y,g)\n",
    "  A_4,c_4 = A_estimate(V_4,U,Y,g)\n",
    "  p_1 = []\n",
    "  p_2 = []\n",
    "  p_3 = []\n",
    "  p_4 = []\n",
    "  T = np.sort(T)\n",
    "  p_exp = np.array([1/(1+np.exp(5*t))for t in T])\n",
    "  for t in range(len(T)):\n",
    "    U_l = style_K(X,T[t]) #U_l = # kernel for the test set\n",
    "    p_1.append(p_estimate(A_1,c_1,U_l))\n",
    "    p_2.append(p_estimate(A_2,c_2,U_l))\n",
    "    p_3.append(p_estimate(A_3,c_3,U_l))\n",
    "    p_4.append(p_estimate(A_4,c_4,U_l))\n",
    "  p_1 = np.array(p_1)\n",
    "  p_2 = np.array(p_2)\n",
    "  p_3 = np.array(p_3)\n",
    "  p_4 = np.array(p_4)\n",
    "  error_1 = LA.norm(p_exp-p_1)/len(T)\n",
    "  error_2 = LA.norm(p_exp-p_2)/len(T)\n",
    "  error_3 = LA.norm(p_exp-p_3)/len(T)\n",
    "  error_4 = LA.norm(p_exp-p_4)/len(T)\n",
    "  return error_1,error_2,error_3,error_4\n",
    "def test_methods_review(T,X,Y,V_5):\n",
    "  U = gram_matrix(X)# get the gram matrix for the given training set X\n",
    "  g = 0.1  \n",
    "  A_5, c_5 = A_estimate(V_5,U,Y,g)\n",
    "  p_5 = []\n",
    "  T = np.sort(T)\n",
    "  p_exp = np.array([1/(1+np.exp(5*t))for t in T])\n",
    "  for t in range(len(T)):\n",
    "    U_l = style_K(X,T[t]) #U_l = # kernel for the test set\n",
    "    p_5.append(p_estimate(A_5,c_5,U_l))\n",
    "  p_5 = np.array(p_5)\n",
    "  error_5 = LA.norm(p_exp-p_5)/len(T)\n",
    "  return error_5 \n",
    "#Estimate of A and c\n",
    "def A_estimate(V,U,Y,g):\n",
    "  l = V.shape[0]\n",
    "  I = np.identity(l)\n",
    "  O = np.ones((l,1))\n",
    "  a_1 = np.matmul(V,U)\n",
    "  a_2 = np.matmul(V,Y.reshape(l,1))\n",
    "  a_3 = np.matmul(V,O)\n",
    "  T = np.linalg.inv(a_1+g*I) # g:regularization constant\n",
    "  A_b = np.matmul(T,a_2).reshape(l,1) \n",
    "  A_c = np.matmul(T,a_3).reshape(l,1) \n",
    "  c_1 = np.matmul(O.transpose(),np.matmul(a_1,A_b)-a_2) \n",
    "  c_2 = np.matmul(O.transpose(),np.matmul(a_1,A_c)-a_3)\n",
    "  c = c_1/c_2 \n",
    "  A = A_b - c[0,0]*A_c\n",
    "  return A,c\n",
    "#Conditional probability estimate for a given x\n",
    "def p_estimate(A,c,U_l):\n",
    "  p = np.matmul(A.transpose(),U_l)+c\n",
    "  return p[0,0] \n",
    "\n",
    "def gram_matrix(X):\n",
    "   l = X.shape[0]\n",
    "   U = np.zeros((l,l))\n",
    "   K = Kernel.gaussian(1)         \n",
    "   for i in range(l):\n",
    "     for j in range(l):\n",
    "       U[i,j] = K(X[i],X[j])\n",
    "   return U\n",
    "def style_K(X,t):\n",
    "   l = X.shape[0]\n",
    "   U_l = np.zeros((l,1))\n",
    "   K = Kernel.gaussian(1)\n",
    "   for i in range(l):\n",
    "     U_l[i] = K(t,X[i])    \n",
    "   return U_l  \n",
    "class SVMTrainer(object):\n",
    "    def __init__(self, kernel, c):\n",
    "        self._kernel = kernel\n",
    "        self._c = c\n",
    "\n",
    "    def train(self, X, y):\n",
    "        \"\"\"Given the training features X with labels y, returns a SVM\n",
    "        predictor representing the trained SVM.\n",
    "        \"\"\"\n",
    "        lagrange_multipliers = self._compute_multipliers(X, y)\n",
    "        return self._construct_predictor(X, y, lagrange_multipliers)\n",
    "\n",
    "    def _gram_matrix(self, X):\n",
    "        n_samples, n_features = X.shape\n",
    "        K = np.zeros((n_samples, n_samples))\n",
    "        # TODO(tulloch) - vectorize\n",
    "        for i, x_i in enumerate(X):\n",
    "            for j, x_j in enumerate(X):\n",
    "                K[i, j] = self._kernel(x_i, x_j)\n",
    "        return K\n",
    "\n",
    "    def _construct_predictor(self, X, y, lagrange_multipliers):\n",
    "        support_vector_indices = \\\n",
    "            lagrange_multipliers > MIN_SUPPORT_VECTOR_MULTIPLIER\n",
    "\n",
    "        support_multipliers = lagrange_multipliers[support_vector_indices]\n",
    "        support_vectors = X[support_vector_indices]\n",
    "        support_vector_labels = y[support_vector_indices]\n",
    "\n",
    "        # http://www.cs.cmu.edu/~guestrin/Class/10701-S07/Slides/kernels.pdf\n",
    "        # bias = y_k - \\sum z_i y_i  K(x_k, x_i)\n",
    "        # Thus we can just predict an example with bias of zero, and\n",
    "        # compute error.\n",
    "        bias = np.mean(\n",
    "            [y_k - SVMPredictor(\n",
    "                kernel=self._kernel,\n",
    "                bias=0.0,\n",
    "                weights=support_multipliers,\n",
    "                support_vectors=support_vectors,\n",
    "                support_vector_labels=support_vector_labels).predict(x_k)\n",
    "             for (y_k, x_k) in zip(support_vector_labels, support_vectors)])\n",
    "\n",
    "        return SVMPredictor(\n",
    "            kernel=self._kernel,\n",
    "            bias=bias,\n",
    "            weights=support_multipliers,\n",
    "            support_vectors=support_vectors,\n",
    "            support_vector_labels=support_vector_labels)\n",
    "\n",
    "    def _compute_multipliers(self, X, y):\n",
    "        n_samples, n_features = X.shape\n",
    "\n",
    "        K = self._gram_matrix(X)\n",
    "        # Solves\n",
    "        # min 1/2 x^T P x + q^T x\n",
    "        # s.t.\n",
    "        #  Gx \\coneleq h\n",
    "        #  Ax = b\n",
    "\n",
    "        P = cvxopt.matrix(np.outer(y, y) * K)\n",
    "        q = cvxopt.matrix(-1 * np.ones(n_samples))\n",
    "\n",
    "        # -a_i \\leq 0\n",
    "        # TODO(tulloch) - modify G, h so that we have a soft-margin classifier\n",
    "        G_std = cvxopt.matrix(np.diag(np.ones(n_samples) * -1))\n",
    "        h_std = cvxopt.matrix(np.zeros(n_samples))\n",
    "\n",
    "        # a_i \\leq c\n",
    "        G_slack = cvxopt.matrix(np.diag(np.ones(n_samples)))\n",
    "        h_slack = cvxopt.matrix(np.ones(n_samples) * self._c)\n",
    "\n",
    "        G = cvxopt.matrix(np.vstack((G_std, G_slack)))\n",
    "        h = cvxopt.matrix(np.vstack((h_std, h_slack)))\n",
    "\n",
    "        A = cvxopt.matrix(y, (1, n_samples))\n",
    "        b = cvxopt.matrix(0.0)\n",
    "\n",
    "        solution = cvxopt.solvers.qp(P, q, G, h, A, b)\n",
    "\n",
    "        # Lagrange multipliers\n",
    "        return np.ravel(solution['x'])\n",
    "class SVMPredictor(object):\n",
    "    def __init__(self,\n",
    "                 kernel,\n",
    "                 bias,\n",
    "                 weights,\n",
    "                 support_vectors,\n",
    "                 support_vector_labels):\n",
    "        self._kernel = kernel\n",
    "        self._bias = bias\n",
    "        self._weights = weights\n",
    "        self._support_vectors = support_vectors\n",
    "        self._support_vector_labels = support_vector_labels\n",
    "\n",
    "    def predict(self, x):\n",
    "        \"\"\"\n",
    "        Computes the SVM prediction on the given features x.\n",
    "        \"\"\"\n",
    "        result = self._bias\n",
    "        for z_i, x_i, y_i in zip(self._weights,\n",
    "                                 self._support_vectors,\n",
    "                                 self._support_vector_labels):\n",
    "            result += z_i * y_i * self._kernel(x_i, x)\n",
    "        return np.sign(result).item()   \n",
    "import numpy.linalg as la\n",
    "\n",
    "\n",
    "class Kernel(object):\n",
    "    \"\"\"Implements list of kernels from\n",
    "    http://en.wikipedia.org/wiki/Support_vector_machine\n",
    "    \"\"\"\n",
    "    @staticmethod\n",
    "    def linear():\n",
    "        def f(x, y):\n",
    "            return np.inner(x, y)\n",
    "        return f\n",
    "\n",
    "    @staticmethod\n",
    "    def gaussian(sigma):\n",
    "        def f(x, y):\n",
    "            exponent = -np.sqrt(la.norm(x-y)**2  / (2 * sigma ** 2))\n",
    "            return np.exp(exponent)\n",
    "        return f\n",
    "\n",
    "    @staticmethod\n",
    "    def _polykernel(dimension, offset):\n",
    "        def f(x, y):\n",
    "            return (offset + np.dot(x, y)) ** dimension\n",
    "        return f\n",
    "\n",
    "    @staticmethod\n",
    "    def inhomogenous_polynomial(dimension):\n",
    "        return Kernel._polykernel(dimension=dimension, offset=1.0)\n",
    "\n",
    "    @staticmethod\n",
    "    def homogenous_polynomial(dimension):\n",
    "        return Kernel._polykernel(dimension=dimension, offset=0.0)\n",
    "\n",
    "    @staticmethod\n",
    "    def hyperbolic_tangent(kappa, c):\n",
    "        def f(x, y):\n",
    "            return np.tanh(kappa * np.dot(x, y) + c)\n",
    "        return f\n",
    "\"\"\"We start by sampling points randomly from -1 to 1\"\"\"\n",
    "def random_labels(X, prob):\n",
    "  y = []\n",
    "  for x in X:\n",
    "    if random.random() < prob(x):\n",
    "      y.append(1)\n",
    "    else:\n",
    "      y.append(0)\n",
    "  return np.array(y)\n",
    "def check_methods():\n",
    "  number_of_points = 100 #Number of training points\n",
    "  l = number_of_points\n",
    "  X = (2 * (np.random.rand(number_of_points))) - 1\n",
    "  balance = 0.5 #training data balance\n",
    "  for i in range(number_of_points):\n",
    "      num = np.random.rand(1)\n",
    "      if num < balance:\n",
    "        X[i]=np.random.rand(1)-1\n",
    "      else:\n",
    "        X[i]=np.random.rand(1)   \n",
    "      X = np.array(X)  \n",
    "      X = np.squeeze(X)\n",
    "\n",
    "      \n",
    "\n",
    "  p = lambda x: 1/(1 + np.exp(5* x)) # the probability of x being labeled y=1\n",
    "  Y = random_labels(X, p)\n",
    "  print(Y.shape)\n",
    "  xs = [-1 + (i/20) for i in range(41)]\n",
    "  true_p = [p(x) for x in xs]\n",
    "  plt.plot(xs, true_p, label='p(y=1|x)')\n",
    "  plt.plot(X, Y, '.', label='Data')\n",
    "  plt.legend(loc='best')\n",
    "  plt.show()\n",
    "  l = number_of_points\n",
    "  V_1 = np.identity(l) # without Vapnik\n",
    "  V_2 = np.identity(l) # Vapnik \n",
    "  for i in range(l):\n",
    "    for j in range(l):\n",
    "      V_2[i,j] = 1-np.maximum(X[i],X[j])\n",
    "\n",
    "  \"\"\"We label the points according a Sigmoid function\"\"\"\n",
    "\n",
    "  n_t_array = [i for i in range(100,550,100)] # number of test points\n",
    "  h = 2\n",
    "  E_1 = []\n",
    "  E_2 = []\n",
    "  E_3 = []\n",
    "  E_4 = []\n",
    "  balance = 0.7 #test data balance\n",
    "  tau = [0.3]\n",
    "  alpha = [0.3]\n",
    "  E_5 = [[] for ta in tau]\n",
    "  E_6 = [[] for alph in alpha]\n",
    "  E_7 = []\n",
    "  D = []\n",
    "  D.append(X)\n",
    "  D.append(Y)\n",
    "  ctr = 1\n",
    "  for n_t in n_t_array:\n",
    "    T = (2 * (np.random.rand(n_t))) - 1\n",
    "    for i in range(n_t):\n",
    "      num = np.random.rand(1)\n",
    "      if num < balance:\n",
    "        T[i]=np.random.rand(1)-1\n",
    "      else:\n",
    "        T[i]=np.random.rand(1)   \n",
    "    T = np.array(T)  \n",
    "    T = np.squeeze(T)\n",
    "    D.append(T)\n",
    "    V_3= V_matrix_new(T,X,n_t) \n",
    "    V_4 = V_matrix_Shimodaira(T,X,n_t,h) \n",
    "    error_1,error_2,error_3, error_4 = test_methods(T,X,Y,V_1,V_2,V_3,V_4)  \n",
    "    E_1.append(error_1)\n",
    "    E_2.append(error_2)\n",
    "    E_3.append(error_3)\n",
    "    E_4.append(error_4)\n",
    "    for ta in range(len(tau)):\n",
    "      V_5 = V_matrix_Sugiyama(T,X,n_t,h,tau[ta])\n",
    "      error_5 = test_methods_review(T,X,Y,V_5)\n",
    "      E_5[ta].append(error_5)\n",
    "    for alph in range(len(alpha)):\n",
    "      V_6 = V_matrix_Makoto(T,X,n_t,h,alpha[alph])  \n",
    "      error_6 = test_methods_review(T,X,Y,V_6)\n",
    "      E_6[alph].append(error_6)\n",
    "    V_7 = V_matrix_Huang(T,X,n_t)\n",
    "    error_7 = test_methods_review(T,X,Y,V_7) \n",
    "    E_7.append(error_7) \n",
    "    ctr+=1  \n",
    "  return E_1,E_2,E_3,E_4,E_5[0],E_6[0],E_7,D  \n",
    "M = 1\n",
    "E_big_1 = [[] for i in range(M)]  \n",
    "E_big_2 = [[] for i in range(M)]  \n",
    "E_big_3 = [[] for i in range(M)]  \n",
    "E_big_4 = [[] for i in range(M)]  \n",
    "E_big_5 = [[] for i in range(M)]  \n",
    "E_big_6 = [[] for i in range(M)]  \n",
    "E_big_7 = [[] for i in range(M)]  \n",
    "n_t_array = [i for i in range(100,550,100)]\n",
    "U = {}\n",
    "for i in range(M):\n",
    "  E_big_1[i], E_big_2[i], E_big_3[i],E_big_4[i],E_big_5[i],E_big_6[i],E_big_7[i],D = check_methods()\n",
    "  U['pass_'+str(i)] = D\n",
    "sio.savemat('data.mat',U)\n",
    "E_big_1 = np.array([np.array(E_big_1[i]) for i in range(M)])  \n",
    "E_big_2 = np.array([np.array(E_big_2[i]) for i in range(M)])  \n",
    "E_big_3 = np.array([np.array(E_big_3[i]) for i in range(M)])  \n",
    "E_big_4 = np.array([np.array(E_big_4[i]) for i in range(M)])  \n",
    "E_big_5 = np.array([np.array(E_big_5[i]) for i in range(M)])  \n",
    "E_big_6 = np.array([np.array(E_big_6[i]) for i in range(M)])  \n",
    "E_big_7 = np.array([np.array(E_big_7[i]) for i in range(M)])   \n",
    "E_1_mean = []\n",
    "E_2_mean = []\n",
    "E_3_mean = []\n",
    "E_4_mean = []\n",
    "E_5_mean = []\n",
    "E_6_mean = []\n",
    "E_7_mean = []\n",
    "E_1_std = []\n",
    "E_2_std = []\n",
    "E_3_std = []\n",
    "E_4_std = []\n",
    "E_5_std = []\n",
    "E_6_std = []\n",
    "E_7_std = []\n",
    "for i in range(len(n_t_array)):\n",
    "  E_1_mean.append(np.mean(E_big_1[:,i]))\n",
    "  E_2_mean.append(np.mean(E_big_2[:,i]))\n",
    "  E_3_mean.append(np.mean(E_big_3[:,i]))\n",
    "  E_4_mean.append(np.mean(E_big_4[:,i]))\n",
    "  E_5_mean.append(np.mean(E_big_5[:,i]))\n",
    "  E_6_mean.append(np.mean(E_big_6[:,i]))\n",
    "  E_7_mean.append(np.mean(E_big_7[:,i]))\n",
    "  E_1_std.append(np.std(E_big_1[:,i]))\n",
    "  E_2_std.append(np.std(E_big_2[:,i]))\n",
    "  E_3_std.append(np.std(E_big_3[:,i]))\n",
    "  E_4_std.append(np.std(E_big_4[:,i]))\n",
    "  E_5_std.append(np.std(E_big_5[:,i]))\n",
    "  E_6_std.append(np.std(E_big_6[:,i]))\n",
    "  E_7_std.append(np.std(E_big_7[:,i]))\n",
    "np.savetxt('V_1_mean.csv', E_1_mean, delimiter=\",\")\n",
    "np.savetxt('V_1_std.csv', E_1_std, delimiter=\",\")  \n",
    "np.savetxt('V_2_mean.csv', E_2_mean, delimiter=\",\")\n",
    "np.savetxt('V_2_std.csv', E_2_std, delimiter=\",\") \n",
    "np.savetxt('V_3_mean.csv', E_3_mean, delimiter=\",\")\n",
    "np.savetxt('V_3_std.csv', E_3_std, delimiter=\",\") \n",
    "np.savetxt('V_4_mean.csv', E_4_mean, delimiter=\",\")\n",
    "np.savetxt('V_4_std.csv', E_4_std, delimiter=\",\") \n",
    "np.savetxt('V_5_mean.csv', E_5_mean, delimiter=\",\")\n",
    "np.savetxt('V_5_std.csv', E_5_std, delimiter=\",\") \n",
    "np.savetxt('V_6_mean.csv', E_6_mean, delimiter=\",\")\n",
    "np.savetxt('V_6_std.csv', E_6_std, delimiter=\",\") \n",
    "np.savetxt('V_7_mean.csv', E_7_mean, delimiter=\",\")\n",
    "np.savetxt('V_7_std.csv', E_7_std, delimiter=\",\") \n",
    "plt.errorbar(n_t_array,E_1_mean,E_1_std,marker='x', label='V = I',capsize = 5) # No Vapnik\n",
    "plt.errorbar(n_t_array,E_2_mean,E_2_std,marker= '+',label='V in Vapnik',capsize = 5) # Vapnik V\n",
    "plt.errorbar(n_t_array, E_3_mean,E_3_std,marker='d', label = 'Proposed V',capsize = 5) #Our V\n",
    "plt.errorbar(n_t_array, E_4_mean,E_4_std,marker='*', label = 'Shimodaira',capsize = 5) #Shimodaira\n",
    "plt.errorbar(n_t_array, E_7_mean,E_7_std,marker='d', label = 'Huang',capsize = 5) #Huang\n",
    "plt.errorbar(n_t_array, E_5_mean,E_5_std,marker='*', label = 'Sugiyama',capsize = 5) #Sugiyama\n",
    "plt.errorbar(n_t_array, E_6_mean,E_6_std,marker='d', label = 'Makoto',capsize = 5) #Makoto\n",
    "plt.legend(loc='best')\n",
    "plt.xlabel('Number of test points')\n",
    "plt.ylabel('Normalized L2-error')\n",
    "plt.grid()\n",
    "plt.savefig('Comparison_5_7_new.png')\n",
    "\"\"\"(1) Stability of estimated probability curve is controlled by number of training points.\n",
    "Result: Both Vapnik and our method are more stable than classical SVM. \n",
    "\n",
    "---\n",
    "\n",
    "(2) Test distribution is not uniform and is instead chosen to be \"biased\" towards one half, meaning the probability that a point in the test set distribution falls in the range [0,1] is given by balance. For unifrom distribution in [-1,1], balance = 0.5. If we want probability of range [0,1] to be 0.7, balance = 0.3.  \n",
    "\n",
    "---\n",
    "\n",
    "(3) The empirical estimate of test distribution becomes better with more test data n_t. Our method performs better than Vapnik  when the L2-error is compared for the conditional probability estimates.\n",
    "\"\"\"\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "name": "Vapnik_Review",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
