UCI糖尿病数据利用逻辑回归算法进行训练和预测

UCI糖尿病数据利用逻辑回归算法进行训练和预测
jupyter

{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "diabetes_data = pd.read_csv('diabetes.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Pregnancies</th>\n",
       "      <th>Glucose</th>\n",
       "      <th>BloodPressure</th>\n",
       "      <th>SkinThickness</th>\n",
       "      <th>Insulin</th>\n",
       "      <th>BMI</th>\n",
       "      <th>DiabetesPedigreeFunction</th>\n",
       "      <th>Age</th>\n",
       "      <th>Outcome</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>6</td>\n",
       "      <td>148</td>\n",
       "      <td>72</td>\n",
       "      <td>35</td>\n",
       "      <td>0</td>\n",
       "      <td>33.6</td>\n",
       "      <td>0.627</td>\n",
       "      <td>50</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>85</td>\n",
       "      <td>66</td>\n",
       "      <td>29</td>\n",
       "      <td>0</td>\n",
       "      <td>26.6</td>\n",
       "      <td>0.351</td>\n",
       "      <td>31</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>8</td>\n",
       "      <td>183</td>\n",
       "      <td>64</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>23.3</td>\n",
       "      <td>0.672</td>\n",
       "      <td>32</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1</td>\n",
       "      <td>89</td>\n",
       "      <td>66</td>\n",
       "      <td>23</td>\n",
       "      <td>94</td>\n",
       "      <td>28.1</td>\n",
       "      <td>0.167</td>\n",
       "      <td>21</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0</td>\n",
       "      <td>137</td>\n",
       "      <td>40</td>\n",
       "      <td>35</td>\n",
       "      <td>168</td>\n",
       "      <td>43.1</td>\n",
       "      <td>2.288</td>\n",
       "      <td>33</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Pregnancies  Glucose  BloodPressure  SkinThickness  Insulin   BMI  \\\n",
       "0            6      148             72             35        0  33.6   \n",
       "1            1       85             66             29        0  26.6   \n",
       "2            8      183             64              0        0  23.3   \n",
       "3            1       89             66             23       94  28.1   \n",
       "4            0      137             40             35      168  43.1   \n",
       "\n",
       "   DiabetesPedigreeFunction  Age  Outcome  \n",
       "0                     0.627   50        1  \n",
       "1                     0.351   31        0  \n",
       "2                     0.672   32        1  \n",
       "3                     0.167   21        0  \n",
       "4                     2.288   33        1  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "diabetes_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def sigmoid(z):\n",
    "    return 1 / (1 + np.exp(-z))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.5"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "sigmoid(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x1dd0d80a908>]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXcAAAD8CAYAAACMwORRAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMi4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvhp/UCwAAHelJREFUeJzt3Xt8VPWd//HXh4SLCoiCpCoWoaAuVrcaxKK2QnUtUITaFcSu1l7Z/rr0113b3wraosW2q7v667Yr2iurpR0Q6w01Sisk+rCKAq2goEikXrIgeEMIKBDy2T++ExziJDOZ25nL+/l4nEfOmfOdyZuTySdfvnPO+Zq7IyIi5aVb1AFERCT3VNxFRMqQiruISBlScRcRKUMq7iIiZUjFXUSkDKm4i4iUIRV3EZEypOIuIlKGqqP6xgMGDPBjjz02o+fu3LmTQw45JLeBckj5sqN82Sv2jMqXuVWrVr3h7kekbOjukSy1tbWeqfr6+oyfWwjKlx3ly16xZ1S+zAErPY0aq2EZEZEypOIuIlKGVNxFRMqQiruISBlScRcRKUMpi7uZzTOzrWb2bAf7zcx+amaNZrbGzE7NfUwREemKdHrutwLjOtk/HhgeX6YDt2QfS0REspHyIiZ3f9TMju2kyWTgN/HzL5ebWT8zO9LdN+coo4hI4A7vvgu7d0NLC+zd27Wl7TmtrQcu7gdsH/X88/Dssx9s19Y2cWnL1ZX188+H007L66HKxRWqRwOvJmw3xR/7QHE3s+mE3j01NTU0NDRk9A2bm5szfm4hKF92lC97xZqxescOem3eTM/XX+eZxx6jetcuqnbt2v815fq772KtrXnPeVweX9vN2NDczKadO/P4XXJT3C3JY0ln3Xb3XwC/ABg5cqSPGTMmo2/Y0NBAps8tBOXLjvJlL7KM7rB1KzQ2huXFFw9cf+utjp9bVQV9+0KfPmHp2xf6939/ve3x3r2hZ0/o3r3rS3V1+FpVBd26hcXs/fX48qfHH+fMT3ziA49j9n57eH873XVCwTyO/P4BgdwU9ybgmITtQcCmHLyuiBSj1lZoajqweCcW8cQeabduMHgwDBsGF10EH/kIDB3KX15+mVPOPvvAwt2r1wFFMEp7DzsMBgyIOkZWclHcFwMzzGwhcDrwjsbbRcpMSwssXQrz58M99xxYwHv0gCFDQgEfMyYU8GHDwjJ4cNjfzjsNDXDKKQWLX4lSFnczWwCMAQaYWRNwNdAdwN1/BtQBE4BGYBfwpXyFFZECcofVq0NBj8XgtdegXz/4/Oehtvb9Aj5oUBjmkKKSztkyF6fY78A/5SyRiESrqSkU8/nzwxkj3bvDZz4Dl14avvbsGXVCSUNk93MXkSKyYwfcdVco6MuWhV776NFw880wdWr4YFNKioq7SKVqaYGHHw4F/e67w/njQ4fC7NlwySVhyEVKloq7SKVZvRpuuy0MvWzZAocdBpddFoZdRo8umjNWJDsq7iKVwh1+8IPQM+/eHSZODAV9wgSNo5chFXeRStDSAt/4Bvzyl6Gg/+d/wuGHR51K8kjFXaTc7dwZLiB64AG48srQe9fQS9lTcRcpZ1u3huGXVavgllvg61+POpEUiIq7SLlqbIRx42DTpnA2zKRJUSeSAlJxFylDfdatgylTwsayZfDxj0cbSApO0+yJlJv77uNjl18ebsj1+OMq7BVKxV2knPz85/DZz7Lz2GNDYR8+POpEEhEVd5Fy4A7f/W74wHTcOFb/+MdQUxN1KomQirtIqdu7F770JfjhD+ErX4F772XfQQdFnUoipuIuUsp27AinOt52G1xzTbhIqVrnSYjOlhEpXZs3h1vwrlkDv/41fPnLUSeSIqLiLlKKnn8+nMP+xhtw330wfnzUiaTIqLiLlJo//SlckFRdDQ0NMHJk1ImkCGnMXaSUrFkD554bJs944gkVdumQeu4ipeRf/xUOOggeewwGDow6jRQxFXeRUrF0KSxZAjfcoMIuKWlYRqQUtLbCFVfAhz8M/6T56CU19dxFSsGiReG2vbfdBr16RZ1GSoB67iLFbs8euOoqOOkk+Id/iDqNlAj13EWK3c9/Dhs3Ql0dVFVFnUZKhHruIsVs+3aYMwfGjg0XLYmkScVdpJjdcEO4CvX66zXvqXSJirtIsXrtNbjxRpg6FU47Leo0UmJU3EWK1fe/Hz5M/eEPo04iJUjFXaQYvfBCuH3vP/4jDBsWdRopQSruIsXoyivDbQa+972ok0iJSqu4m9k4M1tvZo1mNjPJ/g+bWb2Z/cXM1pjZhNxHFakQy5fDnXfCd76jqfIkYymLu5lVAXOB8cAI4GIzG9Gu2XeBRe5+CjANuDnXQUUqgnu4zcDAgXD55VGnkRKWzkVMo4BGd98IYGYLgcnAuoQ2DvSNrx8KbMplSJGKUVcHjz4Kc+dCnz5Rp5ESlk5xPxp4NWG7CTi9XZtrgD+Y2TeBQ4Bzc5JOpJLs2wczZ4YPUL/2tajTSIkzd++8gdkU4NPu/tX49qXAKHf/ZkKby+OvdaOZjQZ+DXzU3VvbvdZ0YDpATU1N7cKFCzMK3dzcTO/evTN6biEoX3YqNd+HHnqIE66/nrVXX83rY8Zk9VqVegxzpZjzjR07dpW7p56lxd07XYDRwJKE7VnArHZt1gLHJGxvBAZ29rq1tbWeqfr6+oyfWwjKl52KzLdrl/ugQe6jRrm3tmb9chV5DHOomPMBKz1F3Xb3tM6WWQEMN7MhZtaD8IHp4nZtXgHOATCzvwF6Aa+n8doiAnDTTdDUpNsMSM6kLO7u3gLMAJYAzxHOillrZnPMbFK82beBr5nZamAB8MX4XxgRSeWtt+BHP4IJEyDL4RiRNmnd8tfd64C6do/NTlhfB5yZ22giFeK66+Cdd+Df/i3qJFJGdIWqSJReeQV++lP4whfg5JOjTiNlRMVdJEpXXx2+zpkTbQ4pOyruIlF55pkwJ+o3vxkmvhbJIRV3kajMnAmHHgqzZkWdRMqQ5lAViUJDQ7jVwPXXw+GHR51GypB67iKF1nZzsEGDwpCMSB6o5y5SaHfeCU89BfPmhXu2i+SBeu4ihbR3b5iI48QTw+mPInminrtIId1zD2zYEL5WVUWdRsqYeu4ihRSLwZFHwsSJUSeRMqfiLlIo27aFM2Quuki9dsk7FXeRQrnrLtizBz7/+aiTSAVQcRcplFgszLI0MvU8CyLZUnEXKYTNm2HZstBr1/3apQBU3EUKYdGicPHSxRdHnUQqhIq7SCHEYnDKKXDCCVEnkQqh4i6Sb42N4YpUfZAqBaTiLpJvCxaEcfZp06JOIhVExV0kn9zDkMwnPxluFCZSICruIvm0ejU8/7w+SJWCU3EXyadYDKqr4cILo04iFUbFXSRfWlvDePu4cdC/f9RppMKouIvky2OPQVOTzpKRSKi4i+TLggVw8MEwaVLUSaQCqbiL5MOePeGq1MmT4ZBDok4jFUjFXSQf/vhHeOstDclIZFTcRfIhFoPDD4fzzos6iVQoFXeRXNu5E+69F6ZMgR49ok4jFUrFXSTX7rsvFHhduCQRUnEXybVYDI4+Gj7xiaiTSAVTcRfJpTffhAcfDL32bvr1kuik9e4zs3Fmtt7MGs1sZgdtpprZOjNba2ax3MYUKRF33gktLTpLRiJXnaqBmVUBc4G/A5qAFWa22N3XJbQZDswCznT3t81sYL4CixS1BQvg+OPhYx+LOolUuHR67qOARnff6O57gIXA5HZtvgbMdfe3Adx9a25jipSApiZ45BHNkypFwdy98wZmFwLj3P2r8e1LgdPdfUZCm3uAF4AzgSrgGnd/KMlrTQemA9TU1NQuXLgwo9DNzc307t07o+cWgvJlp1TzDVq0iGG33MKT8+fzbsT3bi/VY1gsijnf2LFjV7n7yJQN3b3TBZgC/Cph+1Lgv9q1uR+4G+gODCEM3/Tr7HVra2s9U/X19Rk/txCULzslm+/UU91PO62gWTpSssewSBRzPmClp6jb7p7WsEwTcEzC9iBgU5I297r7Xnf/K7AeGJ7Ga4uUh/Xr4c9/1gepUjTSKe4rgOFmNsTMegDTgMXt2twDjAUwswHAccDGXAYVKWpt86ROnRp1EhEgjeLu7i3ADGAJ8BywyN3XmtkcM2u7l+kS4E0zWwfUA//P3d/MV2iRotI2T+rYsXDUUVGnEQHSOBUSwN3rgLp2j81OWHfg8vgiUllWrYING+CKK6JOIrKfLqETyVYsFm4Q9rnPRZ1EZD8Vd5Fs7NsHt98O48fDYYdFnUZkPxV3kWw8+ihs2qSzZKToqLiLZCMWg969YeLEqJOIHEDFXSRTu3fD738PF1wQJsIWKSIq7iKZWrIEtm3TkIwUJRV3kUzFYjBgAJxzTtRJRD5AxV0kEzt2wOLF4YrU7t2jTiPyASruIpm49154910NyUjRUnEXycSCBTB4MIweHXUSkaRU3EW6qPu2beHD1GnTNE+qFC29M0W66IhHHglXpmpIRoqYirtIFw1cuhROPBFOOinqKCIdUnEX6YpXXqHfM89onlQpeiruIl3RNu/vtGnR5hBJQcVdpCtiMd4ZMQKGDo06iUinVNxF0rV2LaxezVZdkSolQMVdJF0LFkC3bmwdMybqJCIpqbiLpMM9FPdzz2Xv4YdHnUYkJRV3kXQ89RRs3AgXXxx1EpG0qLiLpCMWg549w73bRUqAirtIKi0tYZ7UiRPh0EOjTiOSFhV3kVQaGmDLFt1uQEqKirtIKrEY9O0LEyZEnUQkbSruIp157z2480743OegV6+o04ikTcVdpDN1dbB9u4ZkpOSouIt0JhaDmhoYOzbqJCJdouIu0pHt2+H+++Gii6C6Ouo0Il2i4i7Skbvvht27deGSlCQVd5GOxGIwZAicfnrUSUS6LK3ibmbjzGy9mTWa2cxO2l1oZm5mI3MXUSQCW7bAww9rUg4pWSmLu5lVAXOB8cAI4GIzG5GkXR/g/wJP5jqkSMHdcQe0tuosGSlZ6fTcRwGN7r7R3fcAC4HJSdpdC/w78F4O84lEIxaDk0+GER/ox4iUhHSK+9HAqwnbTfHH9jOzU4Bj3P3+HGYTicbGjfDEE+q1S0lL5/yuZAOOvn+nWTfgx8AXU76Q2XRgOkBNTQ0NDQ1phWyvubk54+cWgvJlJ+p8H/7tbxkKPDF4MLuT5Ig6XzqKPaPyFYC7d7oAo4ElCduzgFkJ24cCbwAvxZf3gE3AyM5et7a21jNVX1+f8XMLQfmyE3m+E090P+usDndHni8NxZ5R+TIHrPQUddvd0xqWWQEMN7MhZtYDmAYsTvjj8I67D3D3Y939WGA5MMndV+bij49IQT3zTJgrVee2S4lLWdzdvQWYASwBngMWuftaM5tjZpPyHVCkoGIxqKqCKVOiTiKSlbSuqXb3OqCu3WOzO2g7JvtYIhFobQ3zpJ53HhxxRNRpRLKiK1RF2jzxBLz8ss6SkbKg4i7SZsECOOggmJzsMg6R0qLiLgKwdy8sWgTnnw99+kSdRiRrKu4iAEuXwuuva0hGyoaKuwiEs2T69YNx46JOIpITKu4iu3aFe7dfeCH07Bl1GpGcUHEXeeABaG7WhUtSVlTcRWIxOPJIOPvsqJOI5IyKu1S2t9+GujqYNi1cmSpSJlTcpbLddRfs2aOzZKTsqLhLZVuwAIYNg9raqJOI5JSKu1SuzZth2TLNkyplScVdKtftt4O7zpKRsqTiLpUrFoNTT4UTTog6iUjOqbhLZdqwAVas0AepUrZU3KUyLVwYxtkvuijqJCJ5oeIulccdfvc7+OQnYdCgqNOI5IWKu1Sep5+G9es1JCNlTcVdKk8sBt27w9//fdRJRPJGxV0qS2trGG//9Kehf/+o04jkjYq7VJaHH4amJg3JSNlTcZfK4Q5XXQXHHAMXXBB1GpG8qo46gEjB3HEHrFwJt94KvXpFnUYkr9Rzl8qwdy9ceSWcdBJccknUaUTyTj13qQy/+AW8+GKYdUn3bZcKoJ67lL8dO2DOnDDT0vjxUacRKQj13KX83XgjbN0K992nW/tKxVDPXcrbli1www1w4YUwalTUaUQKRsVdytucObB7N/zoR1EnESkoFXcpXxs2hA9Sp0+H4cOjTiNSUCruUr6uugp69oTZs6NOIlJwaRV3MxtnZuvNrNHMZibZf7mZrTOzNWa21MwG5z6qSBc89VS4aOk734GamqjTiBRcyuJuZlXAXGA8MAK42MxGtGv2F2Cku58M/B7491wHFUmbO1xxBQwcCN/+dtRpRCKRTs99FNDo7hvdfQ+wEJic2MDd6919V3xzOaAZECQ6Dz0EDQ1hOKZPn6jTiETC3L3zBmYXAuPc/avx7UuB0919RgftbwJec/cfJNk3HZgOUFNTU7tw4cKMQjc3N9O7d++MnlsIypedrPLt28fI6dOpeu89nrr1Vrx799yGo/iPHxR/RuXL3NixY1e5+8iUDd290wWYAvwqYftS4L86aHsJoefeM9Xr1tbWeqbq6+szfm4hKF92ssp3663u4H777TnL016xHz/34s+ofJkDVnqK+uruaV2h2gQck7A9CNjUvpGZnQtcBZzt7rvTeF2R3HrvPfje92DkyHDRkkgFS6e4rwCGm9kQ4H+AacABMx2Y2SnAzwnDN1tznlIkHTfdBK++CrfdBt10lq9UtpS/Ae7eAswAlgDPAYvcfa2ZzTGzSfFm/wH0Bu4ws6fNbHHeEosk8/bb4SrUceNg7Nio04hELq0bh7l7HVDX7rHZCevn5jiXSNdcdx1s2xa+ioiuUJUy8Oqr8JOfhEk4/vZvo04jUhRU3KX0XX11uHDp2mujTiJSNFTcpbQ9+2z4AHXGDBisu16ItFFxl9I2a1a4CvXKK6NOIlJUVNyldD36KNx/P8ycCf37R51GpKiouEtpars52NFHw7e+FXUakaKjOVSlNN19NyxfDr/6FRx0UNRpRIqOeu5SevbuDWPtI0bAZZdFnUakKKnnLqVn3jx44QW4916o1ltYJBn13KW0NDfDNdfAWWfB+edHnUakaKnbI6XjjTdg0iTYsgXuugvMok4kUrRU3KU0bNwI48fDyy+HuVFHj446kUhRU3GX4rdqFUyYED5IXboUzjwz6kQiRU9j7lLcHnwQzj47nO74+OMq7CJpUnGX4jVvXvjQ9Ljj4Ikn4IQTok4kUjJU3KX4uMP3vw9f+Qqccw488ggceWTUqURKisbcpbi0tHDcjTfCAw+EC5R++Uvo3j3qVCIlRz13KR7NzTB5Mkc98AB897vw3/+twi6SIRV3KQ5btoS5Tx96iPX/8i9h4g2dxy6SMQ3LSPReeCGcw755M9xzD5v79OH4qDOJlDj13CVay5fDGWfA9u3Q0KBbCojkiIq7RGfxYvjUp6Bfv3Cq46hRUScSKRsq7hKNW26BCy6Aj340XJw0bFjUiUTKioq7FFZLS5jv9BvfCLcUqK+HgQOjTiVSdvSBquSfOzz9NMyfDwsWwGuvwfTpMHeu7scukif6zZL8aWqCWCwU9WefDeesf+Yz8MUvhlv36lRHkbxRcZfc2rEj3Gt9/nxYtiz02kePhptvhqlToX//qBOKVAQVd8leSwv88Y/w29+GiavffReGDoXZs+GSS/RhqUgEVNwlM+7wl7+8P46+ZQscdli4H8yll4beuoZdRCKj4i7p2bcPXn0VGhthxYrQS1+3LoyjT5wYCvqECdCzZ9RJRYQ0i7uZjQN+AlQBv3L369rt7wn8BqgF3gQucveXchtV8m7PHnjppVDAGxvhxRffX//rX8NMSG3OOCOcqz51Khx+eGSRRSS5lMXdzKqAucDfAU3ACjNb7O7rEpp9BXjb3YeZ2TTgeuCifASWDLW2hrsu7tjBIRs3wrZtHyzgr7wS2rXp3TuMl590UrjgaNgw+MhH4Pjj4aijovu3iEhK6fTcRwGN7r4RwMwWApOBxOI+Gbgmvv574CYzM3f3HGYtD+6hgO7de+DS0vLBxzpa9uwJZ6Vs3x6+prPe3Lw/wmmJefr3DwX7jDPgC18I621FfOBAjZuLlKh0ivvRwKsJ203A6R21cfcWM3sH6A+8kYuQB5g3j9PmzIGDDw7b7f9+JPt7kqxN22Op1jva19oalsT1+HJWS0soiomPt7XLx9+7Hj2gb1/o0ycsffvCEUeEM1baHk/Yv3bTJk6cODEU8MMOy30eEYlcOsU9WdetfYVKpw1mNh2YDlBTU0NDQ0Ma3/5A/Tdvpv+gQexMvLKxfe8ySW/Tk/VA2x4zO3B/Z4/Ht71bt/f3d+t2wNc9LS1079kz7O8Wv8NDuzZeXY1XV9NaVYVXVe3f3v9YZ9vV1ew7+GD2HXwwLQcdhPfo0aVj2HzUUbze3AyrV3fpeYXS3Nyc0XujUIo9HxR/RuUrAHfvdAFGA0sStmcBs9q1WQKMjq9XE3rs1tnr1tbWeqbq6+szfm4hKF92lC97xZ5R+TIHrPQUddvd07px2ApguJkNMbMewDRgcbs2i4HL4usXAsviIUREJAIph2U8jKHPIPTOq4B57r7WzOYQ/oIsBn4NzDezRuAtwh8AERGJSFrnubt7HVDX7rHZCevvAVNyG01ERDKl+7mLiJQhFXcRkTKk4i4iUoZU3EVEypCKu4hIGbKoTkc3s9eBlzN8+gDycWuD3FG+7Chf9oo9o/JlbrC7H5GqUWTFPRtmttLdR0adoyPKlx3ly16xZ1S+/NOwjIhIGVJxFxEpQ6Va3H8RdYAUlC87ype9Ys+ofHlWkmPuIiLSuVLtuYuISCeKtrib2RQzW2tmrWY2st2+WWbWaGbrzezTHTx/iJk9aWYbzOz2+O2K85X1djN7Or68ZGZPd9DuJTN7Jt5uZb7yJPm+15jZ/yRknNBBu3HxY9poZjMLmO8/zOx5M1tjZnebWb8O2hX0+KU6HmbWM/6zb4y/147Nd6aE732MmdWb2XPx35NvJWkzxszeSfi5z072WnnM2OnPy4Kfxo/fGjM7tYDZjk84Lk+b2XYz++d2bSI9fllL56bvUSzA3wDHAw3AyITHRwCrgZ7AEOBFoCrJ8xcB0+LrPwP+T4Fy3wjM7mDfS8CACI7lNcB3UrSpih/LoUCP+DEeUaB85wHV8fXrgeujPn7pHA/gG8DP4uvTgNsL+DM9Ejg1vt4HeCFJvjHA/YV+v6X78wImAA8SZnL7OPBkRDmrgNcI548XzfHLdinanru7P+fu65PsmgwsdPfd7v5XoJEwifd+ZmbApwiTdQPcBnw2n3kTvu9UYEG+v1ce7J8I3d33AG0Toeedu//B3Vvim8uBQYX4vimkczwmE95bEN5r58TfA3nn7pvd/c/x9R3Ac4S5jEvJZOA3HiwH+pnZkRHkOAd40d0zvaiyKBVtce9Esgm727+p+wPbEgpGsjb58Algi7tv6GC/A38ws1Xx+WQLaUb8v77zzCzZrNjpHNdC+DKhN5dMIY9fOsfjgInhgbaJ4QsqPhx0CvBkkt2jzWy1mT1oZicWNFjqn1exvOem0XGHLMrjl5W0JuvIFzN7GPhQkl1Xufu9HT0tyWMZTdjdFWlmvZjOe+1nuvsmMxsI/NHMnnf3R7PJlU4+4BbgWsIxuJYwdPTl9i+R5Lk5O5UqneNnZlcBLcDvOniZvB2/JCJ5n3WVmfUG7gT+2d23t9v9Z8JQQ3P8c5Z7gOEFjJfq51UMx68HMIkwN3R7UR+/rERa3N393Aye1gQck7A9CNjUrs0bhP/iVcd7VMnadEmqrGZWDXwOqO3kNTbFv241s7sJ//XPSXFK91ia2S+B+5PsSue4ZiyN43cZMBE4x+MDnkleI2/HL4l0jkdbm6b4z/9QwjSTBWFm3QmF/Xfuflf7/YnF3t3rzOxmMxvg7gW5Z0oaP6+8vufSNB74s7tvab8j6uOXrVIcllkMTIufqTCE8Jf0qcQG8eJQT5isG8Lk3R39TyBXzgWed/emZDvN7BAz69O2TvgQ8dk8Z2r73onjmBd08H3TmQg9X/nGAVcAk9x9VwdtCn38inpi+PjY/q+B59z9/3fQ5kNtnwGY2SjC7/ubBcqXzs9rMfCF+FkzHwfecffNhciXoMP/bUd5/HIi6k90O1oIRagJ2A1sAZYk7LuKcCbDemB8wuN1wFHx9aGEot8I3AH0zHPeW4Gvt3vsKKAuIc/q+LKWMBxRqGM5H3gGWEP4hTqyfb749gTCWRcvFjhfI2Hs9en48rP2+aI4fsmOBzCH8EcIoFf8vdUYf68NLeAxO4swhLEm4bhNAL7e9j4EZsSP1WrCB9VnFDBf0p9Xu3wGzI0f32dIOCuuQBkPJhTrQxMeK4rjl4tFV6iKiJShUhyWERGRFFTcRUTKkIq7iEgZUnEXESlDKu4iImVIxV1EpAypuIuIlCEVdxGRMvS/Tq7yTBjr6swAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "xx = np.arange(-10,10,step=1)\n",
    "yy = sigmoid(xx)\n",
    "plt.grid()\n",
    "plt.plot(xx, yy, 'r')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "def logistic_model(X, theta):\n",
    "    temp = np.dot(X,theta.T)\n",
    "    return sigmoid(temp)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "diabetes_data.insert(0,'Ones',1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Ones</th>\n",
       "      <th>Pregnancies</th>\n",
       "      <th>Glucose</th>\n",
       "      <th>BloodPressure</th>\n",
       "      <th>SkinThickness</th>\n",
       "      <th>Insulin</th>\n",
       "      <th>BMI</th>\n",
       "      <th>DiabetesPedigreeFunction</th>\n",
       "      <th>Age</th>\n",
       "      <th>Outcome</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>6</td>\n",
       "      <td>148</td>\n",
       "      <td>72</td>\n",
       "      <td>35</td>\n",
       "      <td>0</td>\n",
       "      <td>33.6</td>\n",
       "      <td>0.627</td>\n",
       "      <td>50</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>85</td>\n",
       "      <td>66</td>\n",
       "      <td>29</td>\n",
       "      <td>0</td>\n",
       "      <td>26.6</td>\n",
       "      <td>0.351</td>\n",
       "      <td>31</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>8</td>\n",
       "      <td>183</td>\n",
       "      <td>64</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>23.3</td>\n",
       "      <td>0.672</td>\n",
       "      <td>32</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>89</td>\n",
       "      <td>66</td>\n",
       "      <td>23</td>\n",
       "      <td>94</td>\n",
       "      <td>28.1</td>\n",
       "      <td>0.167</td>\n",
       "      <td>21</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>137</td>\n",
       "      <td>40</td>\n",
       "      <td>35</td>\n",
       "      <td>168</td>\n",
       "      <td>43.1</td>\n",
       "      <td>2.288</td>\n",
       "      <td>33</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Ones  Pregnancies  Glucose  BloodPressure  SkinThickness  Insulin   BMI  \\\n",
       "0     1            6      148             72             35        0  33.6   \n",
       "1     1            1       85             66             29        0  26.6   \n",
       "2     1            8      183             64              0        0  23.3   \n",
       "3     1            1       89             66             23       94  28.1   \n",
       "4     1            0      137             40             35      168  43.1   \n",
       "\n",
       "   DiabetesPedigreeFunction  Age  Outcome  \n",
       "0                     0.627   50        1  \n",
       "1                     0.351   31        0  \n",
       "2                     0.672   32        1  \n",
       "3                     0.167   21        0  \n",
       "4                     2.288   33        1  "
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "diabetes_data.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "orig_data = diabetes_data.values\n",
    "cols = orig_data.shape[1]\n",
    "X = orig_data[:,0:cols-1]    #X大写,表示是一个矩阵\n",
    "y = orig_data[:,cols-1:cols] #y小写,表示矢量\n",
    "theta = np.zeros([1,cols-1]) #theta设为行向量"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[0., 0., 0., 0., 0., 0., 0., 0., 0.]])"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "theta"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "def cost(X, y, theta):\n",
    "    item1 = np.multiply(y, np.log(logistic_model(X,theta))) \n",
    "    item2 = np.multiply(1-y, np.log(1 - logistic_model(X,theta))) \n",
    "    return np.sum(item1 - item2) / (len(X))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.20938821079415015"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cost(X, y, theta)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "def gradient(X, y, theta):\n",
    "    grad = np.zeros(theta.shape) #一个梯度是对theta求导的\n",
    "    error = (logistic_model(X,theta) - y).ravel()\n",
    "    for j in range(len(theta.ravel())):\n",
    "        temp = np.multiply(error, X[:,j])\n",
    "        grad[0,j] = np.sum(temp) / len(X)\n",
    "    return grad"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "#拟合 fit,求模型的参数,也称为训练的过程,\n",
    "def fit(X, y, theta, iter_num = 5000, alpha=0.00001):\n",
    "    #梯度下降求解\n",
    "    i = 0 # 迭代次数\n",
    "    grad = np.zeros(theta.shape) # 计算的梯度\n",
    "    costs = [cost(X, y, theta)] # 损失值\n",
    "    while True:\n",
    "        grad = gradient(X, y, theta)\n",
    "        theta = theta - alpha*grad # 参数更新\n",
    "        costs.append(cost(X, y, theta)) # 计算新的损失\n",
    "        i += 1 \n",
    "        if i % (iter_num / 10) == 0: print(costs[i])\n",
    "        if i > iter_num: break\n",
    "    \n",
    "    return theta"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "D:\\Anaconda\\lib\\site-packages\\ipykernel_launcher.py:3: RuntimeWarning: divide by zero encountered in log\n",
      "  This is separate from the ipykernel package so we can avoid doing imports until\n",
      "D:\\Anaconda\\lib\\site-packages\\ipykernel_launcher.py:3: RuntimeWarning: invalid value encountered in multiply\n",
      "  This is separate from the ipykernel package so we can avoid doing imports until\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-5.511409235893268\n",
      "-5.31859458354884\n",
      "-5.063153190867181\n",
      "-4.696751678117883\n",
      "-4.074011252701483\n",
      "-3.902875016698084\n",
      "-3.744762960211906\n",
      "-3.601077279719243\n",
      "-3.4711575061505564\n",
      "-3.352062637279824\n"
     ]
    }
   ],
   "source": [
    "# 调参,只能根据经验来,炼丹\n",
    "theta = fit(X, y, theta,iter_num = 500000, alpha=0.0015)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "D:\\Anaconda\\lib\\site-packages\\sklearn\\model_selection\\_split.py:2026: FutureWarning: From version 0.21, test_size will always complement train_size unless both are specified.\n",
      "  FutureWarning)\n"
     ]
    }
   ],
   "source": [
    "from sklearn.model_selection import train_test_split\n",
    "X_train, X_test, y_train, y_test = train_test_split(X, y, train_size = .8)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(614, 9)"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X_train.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "theta = np.zeros([1,cols-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "D:\\Anaconda\\lib\\site-packages\\ipykernel_launcher.py:3: RuntimeWarning: divide by zero encountered in log\n",
      "  This is separate from the ipykernel package so we can avoid doing imports until\n",
      "D:\\Anaconda\\lib\\site-packages\\ipykernel_launcher.py:3: RuntimeWarning: invalid value encountered in multiply\n",
      "  This is separate from the ipykernel package so we can avoid doing imports until\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-3.4953304853973584\n",
      "-4.075793679628199\n",
      "-3.7134641993740907\n",
      "-3.402073232763518\n",
      "-3.155158733286961\n",
      "-2.9550791865014996\n",
      "-2.785268118118423\n",
      "-2.6323045981679933\n",
      "-2.4989764065989086\n",
      "-2.3919272008733246\n"
     ]
    }
   ],
   "source": [
    "theta = fit(X_train, y_train, theta,iter_num = 1000000, alpha=0.0015)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 测试过程\n",
    "def predict(X,theta, threshold = 0.5):\n",
    "    p = logistic_model(X, theta)\n",
    "    #分类,如果这个概率大于0.5,分类为1,否则为0\n",
    "    y = np.where(p > threshold, 1, 0)\n",
    "    return y"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "# shift + enter\n",
    "myPredict_y = predict(X_test, theta, threshold = 0.5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>0</th>\n",
       "      <th>MyPredict</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>124</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>125</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>126</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>127</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>128</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>129</th>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>130</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>131</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>132</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>133</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>134</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>135</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>136</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>137</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>138</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>139</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>140</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>141</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>142</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>143</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>144</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>145</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>146</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>147</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>148</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>149</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>150</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>151</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>152</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>153</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>154 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       0  MyPredict\n",
       "0    0.0          0\n",
       "1    1.0          1\n",
       "2    1.0          1\n",
       "3    0.0          0\n",
       "4    0.0          0\n",
       "5    0.0          1\n",
       "6    1.0          1\n",
       "7    1.0          1\n",
       "8    0.0          0\n",
       "9    1.0          1\n",
       "10   0.0          0\n",
       "11   0.0          1\n",
       "12   0.0          0\n",
       "13   1.0          1\n",
       "14   0.0          1\n",
       "15   0.0          1\n",
       "16   0.0          0\n",
       "17   0.0          0\n",
       "18   0.0          1\n",
       "19   1.0          1\n",
       "20   0.0          1\n",
       "21   1.0          1\n",
       "22   0.0          0\n",
       "23   0.0          1\n",
       "24   0.0          1\n",
       "25   0.0          0\n",
       "26   0.0          0\n",
       "27   1.0          1\n",
       "28   1.0          1\n",
       "29   0.0          0\n",
       "..   ...        ...\n",
       "124  1.0          1\n",
       "125  1.0          1\n",
       "126  1.0          1\n",
       "127  1.0          1\n",
       "128  0.0          1\n",
       "129  1.0          0\n",
       "130  0.0          1\n",
       "131  0.0          0\n",
       "132  1.0          1\n",
       "133  0.0          1\n",
       "134  0.0          1\n",
       "135  1.0          1\n",
       "136  1.0          1\n",
       "137  1.0          1\n",
       "138  0.0          0\n",
       "139  0.0          1\n",
       "140  0.0          0\n",
       "141  0.0          0\n",
       "142  0.0          1\n",
       "143  0.0          1\n",
       "144  0.0          0\n",
       "145  0.0          0\n",
       "146  0.0          0\n",
       "147  0.0          0\n",
       "148  0.0          0\n",
       "149  0.0          0\n",
       "150  0.0          1\n",
       "151  1.0          1\n",
       "152  0.0          1\n",
       "153  0.0          1\n",
       "\n",
       "[154 rows x 2 columns]"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 要看预测的值和真实值y_test之间的差别\n",
    "yy = pd.DataFrame(y_test)\n",
    "yy[\"MyPredict\"] = myPredict_y\n",
    "yy\n",
    "#20个数据对了16个, 80%准确率"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "D:\\Anaconda\\lib\\site-packages\\sklearn\\utils\\validation.py:578: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n",
      "  y = column_or_1d(y, warn=True)\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,\n",
       "          intercept_scaling=1, max_iter=100, multi_class='ovr', n_jobs=1,\n",
       "          penalty='l2', random_state=None, solver='liblinear', tol=0.0001,\n",
       "          verbose=0, warm_start=False)"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 看sklearn的函数的表现\n",
    "from sklearn.linear_model import LogisticRegression\n",
    "\n",
    "lr = LogisticRegression()\n",
    "\n",
    "lr.fit(X_train, y_train)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [],
   "source": [
    "lr_predict = lr.predict(X_test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([0., 0., 1., 0., 0., 0., 0., 1., 0., 1., 0., 0., 0., 1., 0., 0., 0.,\n",
       "       0., 1., 1., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1., 0., 0., 1.,\n",
       "       0., 0., 1., 0., 0., 0., 1., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0.,\n",
       "       0., 1., 0., 1., 0., 0., 0., 1., 0., 0., 0., 1., 0., 1., 0., 0., 0.,\n",
       "       0., 0., 0., 0., 0., 0., 1., 0., 1., 0., 0., 0., 0., 0., 1., 0., 0.,\n",
       "       0., 1., 0., 1., 1., 0., 0., 1., 0., 0., 0., 0., 0., 1., 1., 0., 1.,\n",
       "       0., 1., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.,\n",
       "       0., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0., 1., 0., 0., 0., 0., 1.,\n",
       "       0., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1., 1., 0.,\n",
       "       1.])"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "lr_predict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>0</th>\n",
       "      <th>MyPredict</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>124</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>125</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>126</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>127</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>128</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>129</th>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>130</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>131</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>132</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>133</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>134</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>135</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>136</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>137</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>138</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>139</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>140</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>141</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>142</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>143</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>144</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>145</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>146</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>147</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>148</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>149</th>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>150</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>151</th>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>152</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>153</th>\n",
       "      <td>0.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>154 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       0  MyPredict\n",
       "0    0.0          0\n",
       "1    1.0          1\n",
       "2    1.0          1\n",
       "3    0.0          0\n",
       "4    0.0          0\n",
       "5    0.0          1\n",
       "6    1.0          1\n",
       "7    1.0          1\n",
       "8    0.0          0\n",
       "9    1.0          1\n",
       "10   0.0          0\n",
       "11   0.0          1\n",
       "12   0.0          0\n",
       "13   1.0          1\n",
       "14   0.0          1\n",
       "15   0.0          1\n",
       "16   0.0          0\n",
       "17   0.0          0\n",
       "18   0.0          1\n",
       "19   1.0          1\n",
       "20   0.0          1\n",
       "21   1.0          1\n",
       "22   0.0          0\n",
       "23   0.0          1\n",
       "24   0.0          1\n",
       "25   0.0          0\n",
       "26   0.0          0\n",
       "27   1.0          1\n",
       "28   1.0          1\n",
       "29   0.0          0\n",
       "..   ...        ...\n",
       "124  1.0          1\n",
       "125  1.0          1\n",
       "126  1.0          1\n",
       "127  1.0          1\n",
       "128  0.0          1\n",
       "129  1.0          0\n",
       "130  0.0          1\n",
       "131  0.0          0\n",
       "132  1.0          1\n",
       "133  0.0          1\n",
       "134  0.0          1\n",
       "135  1.0          1\n",
       "136  1.0          1\n",
       "137  1.0          1\n",
       "138  0.0          0\n",
       "139  0.0          1\n",
       "140  0.0          0\n",
       "141  0.0          0\n",
       "142  0.0          1\n",
       "143  0.0          1\n",
       "144  0.0          0\n",
       "145  0.0          0\n",
       "146  0.0          0\n",
       "147  0.0          0\n",
       "148  0.0          0\n",
       "149  0.0          0\n",
       "150  0.0          1\n",
       "151  1.0          1\n",
       "152  0.0          1\n",
       "153  0.0          1\n",
       "\n",
       "[154 rows x 2 columns]"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "yy"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值