630 lines
66 KiB
Plaintext
630 lines
66 KiB
Plaintext
{
|
||
"cells": [
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": 2,
|
||
"metadata": {},
|
||
"outputs": [
|
||
{
|
||
"data": {
|
||
"text/html": [
|
||
"<div>\n",
|
||
"<style scoped>\n",
|
||
" .dataframe tbody tr th:only-of-type {\n",
|
||
" vertical-align: middle;\n",
|
||
" }\n",
|
||
"\n",
|
||
" .dataframe tbody tr th {\n",
|
||
" vertical-align: top;\n",
|
||
" }\n",
|
||
"\n",
|
||
" .dataframe thead th {\n",
|
||
" text-align: right;\n",
|
||
" }\n",
|
||
"</style>\n",
|
||
"<table border=\"1\" class=\"dataframe\">\n",
|
||
" <thead>\n",
|
||
" <tr style=\"text-align: right;\">\n",
|
||
" <th></th>\n",
|
||
" <th>0</th>\n",
|
||
" <th>1</th>\n",
|
||
" <th>2</th>\n",
|
||
" <th>3</th>\n",
|
||
" <th>4</th>\n",
|
||
" <th>0.1</th>\n",
|
||
" <th>1.1</th>\n",
|
||
" <th>2.1</th>\n",
|
||
" <th>3.1</th>\n",
|
||
" <th>4.1</th>\n",
|
||
" <th>0.2</th>\n",
|
||
" <th>1.2</th>\n",
|
||
" <th>2.2</th>\n",
|
||
" <th>3.2</th>\n",
|
||
" <th>4.2</th>\n",
|
||
" <th>label</th>\n",
|
||
" </tr>\n",
|
||
" </thead>\n",
|
||
" <tbody>\n",
|
||
" <tr>\n",
|
||
" <th>0</th>\n",
|
||
" <td>0.715031</td>\n",
|
||
" <td>0.608764</td>\n",
|
||
" <td>0.631124</td>\n",
|
||
" <td>0.650236</td>\n",
|
||
" <td>0.512070</td>\n",
|
||
" <td>0.277071</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.125949</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.003074</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>hupu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1</th>\n",
|
||
" <td>0.662252</td>\n",
|
||
" <td>0.541335</td>\n",
|
||
" <td>0.570617</td>\n",
|
||
" <td>0.584465</td>\n",
|
||
" <td>0.433609</td>\n",
|
||
" <td>0.451821</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.106180</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>hupu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>2</th>\n",
|
||
" <td>0.894304</td>\n",
|
||
" <td>0.861196</td>\n",
|
||
" <td>0.824562</td>\n",
|
||
" <td>0.870190</td>\n",
|
||
" <td>0.850370</td>\n",
|
||
" <td>0.414012</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.047087</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.033857</td>\n",
|
||
" <td>hupu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>3</th>\n",
|
||
" <td>0.743064</td>\n",
|
||
" <td>0.612346</td>\n",
|
||
" <td>0.575538</td>\n",
|
||
" <td>0.649530</td>\n",
|
||
" <td>0.692186</td>\n",
|
||
" <td>0.158237</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.032681</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.031898</td>\n",
|
||
" <td>hupu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>4</th>\n",
|
||
" <td>0.667459</td>\n",
|
||
" <td>0.508679</td>\n",
|
||
" <td>0.472092</td>\n",
|
||
" <td>0.547407</td>\n",
|
||
" <td>0.598427</td>\n",
|
||
" <td>0.375792</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.184405</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.112612</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.027564</td>\n",
|
||
" <td>hupu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>...</th>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" <td>...</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1596</th>\n",
|
||
" <td>0.809034</td>\n",
|
||
" <td>0.709333</td>\n",
|
||
" <td>0.673414</td>\n",
|
||
" <td>0.743852</td>\n",
|
||
" <td>0.776838</td>\n",
|
||
" <td>0.046705</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.049131</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.027310</td>\n",
|
||
" <td>zhihu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1597</th>\n",
|
||
" <td>0.911794</td>\n",
|
||
" <td>0.816672</td>\n",
|
||
" <td>0.847797</td>\n",
|
||
" <td>0.946110</td>\n",
|
||
" <td>0.986384</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.057710</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.029776</td>\n",
|
||
" <td>zhihu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1598</th>\n",
|
||
" <td>0.965672</td>\n",
|
||
" <td>0.957016</td>\n",
|
||
" <td>0.934561</td>\n",
|
||
" <td>0.991138</td>\n",
|
||
" <td>0.995043</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.097930</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.045403</td>\n",
|
||
" <td>zhihu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1599</th>\n",
|
||
" <td>0.961447</td>\n",
|
||
" <td>0.945493</td>\n",
|
||
" <td>0.927631</td>\n",
|
||
" <td>0.987624</td>\n",
|
||
" <td>0.994379</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.084861</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.066429</td>\n",
|
||
" <td>zhihu</td>\n",
|
||
" </tr>\n",
|
||
" <tr>\n",
|
||
" <th>1600</th>\n",
|
||
" <td>0.969485</td>\n",
|
||
" <td>0.967490</td>\n",
|
||
" <td>0.940832</td>\n",
|
||
" <td>0.994306</td>\n",
|
||
" <td>0.995641</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.000000</td>\n",
|
||
" <td>0.0</td>\n",
|
||
" <td>0.117410</td>\n",
|
||
" <td>zhihu</td>\n",
|
||
" </tr>\n",
|
||
" </tbody>\n",
|
||
"</table>\n",
|
||
"<p>4670 rows × 16 columns</p>\n",
|
||
"</div>"
|
||
],
|
||
"text/plain": [
|
||
" 0 1 2 3 4 0.1 1.1 2.1 3.1 4.1 0.2 1.2 2.2 3.2 4.2 label\n",
|
||
"0 0.715031 0.608764 0.631124 0.650236 0.512070 0.277071 0.0 0.0 0.000000 0.000000 0.125949 0.0 0.003074 0.0 0.000000 hupu\n",
|
||
"1 0.662252 0.541335 0.570617 0.584465 0.433609 0.451821 0.0 0.0 0.000000 0.000000 0.106180 0.0 0.000000 0.0 0.000000 hupu\n",
|
||
"2 0.894304 0.861196 0.824562 0.870190 0.850370 0.414012 0.0 0.0 0.000000 0.000000 0.047087 0.0 0.000000 0.0 0.033857 hupu\n",
|
||
"3 0.743064 0.612346 0.575538 0.649530 0.692186 0.158237 0.0 0.0 0.000000 0.000000 0.032681 0.0 0.000000 0.0 0.031898 hupu\n",
|
||
"4 0.667459 0.508679 0.472092 0.547407 0.598427 0.375792 0.0 0.0 0.184405 0.000000 0.112612 0.0 0.000000 0.0 0.027564 hupu\n",
|
||
"... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...\n",
|
||
"1596 0.809034 0.709333 0.673414 0.743852 0.776838 0.046705 0.0 0.0 0.000000 0.049131 0.000000 0.0 0.000000 0.0 0.027310 zhihu\n",
|
||
"1597 0.911794 0.816672 0.847797 0.946110 0.986384 0.000000 0.0 0.0 0.000000 0.057710 0.000000 0.0 0.000000 0.0 0.029776 zhihu\n",
|
||
"1598 0.965672 0.957016 0.934561 0.991138 0.995043 0.000000 0.0 0.0 0.000000 0.097930 0.000000 0.0 0.000000 0.0 0.045403 zhihu\n",
|
||
"1599 0.961447 0.945493 0.927631 0.987624 0.994379 0.000000 0.0 0.0 0.000000 0.084861 0.000000 0.0 0.000000 0.0 0.066429 zhihu\n",
|
||
"1600 0.969485 0.967490 0.940832 0.994306 0.995641 0.000000 0.0 0.0 0.000000 0.000000 0.000000 0.0 0.000000 0.0 0.117410 zhihu\n",
|
||
"\n",
|
||
"[4670 rows x 16 columns]"
|
||
]
|
||
},
|
||
"execution_count": 2,
|
||
"metadata": {},
|
||
"output_type": "execute_result"
|
||
}
|
||
],
|
||
"source": [
|
||
"import pandas as pd\n",
|
||
"import numpy as np\n",
|
||
"# Train/test feature tables; column 0 of each CSV is used as the row index.\n",
|
||
"train_path = '../datasets/2019-12-21/train.csv'\n",
|
||
"test_path = '../datasets/2019-12-21/test.csv'\n",
|
||
"train_df, test_df = [pd.read_csv(csv_path, index_col=0) for csv_path in (train_path, test_path)]\n",
|
||
"test_df"
|
||
]
|
||
},
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": 3,
|
||
"metadata": {
|
||
"collapsed": true
|
||
},
|
||
"outputs": [],
|
||
"source": [
|
||
"from sklearn.linear_model import LogisticRegression\n",
|
||
"from sklearn.svm import SVC\n",
|
||
"from sklearn.naive_bayes import GaussianNB\n",
|
||
"from sklearn import tree\n",
|
||
"from sklearn.ensemble import RandomForestClassifier\n",
|
||
"from sklearn.metrics import f1_score,recall_score,precision_score"
|
||
]
|
||
},
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": 14,
|
||
"metadata": {},
|
||
"outputs": [
|
||
{
|
||
"name": "stderr",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:430: FutureWarning: Default solver will be changed to 'lbfgs' in 0.22. Specify a solver to silence this warning.\n",
|
||
" warnings.warn(\"Default solver will be changed to 'lbfgs' in 0.22. \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:467: FutureWarning: Default multi_class will be changed to 'auto' in 0.22. Specify the multi_class option to silence this warning.\n",
|
||
" warnings.warn(\"Default multi_class will be changed to 'auto' in\"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\svm\\base.py:189: FutureWarning: The default value of gamma will change from 'auto' to 'scale' in version 0.22 to account better for unscaled features. Set gamma explicitly to 'auto' or 'scale' to avoid this warning.\n",
|
||
" warnings.warn(\"The default value of gamma will change \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\ensemble\\forest.py:244: FutureWarning: The default value of n_estimators will change from 10 in version 0.20 to 100 in 0.22.\n",
|
||
" warn(\"The default value of n_estimators will change from \"\n"
|
||
]
|
||
},
|
||
{
|
||
"name": "stdout",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"precision 0.801927\n",
|
||
"recall 0.801927\n",
|
||
"f1 0.801927\n",
|
||
"Name: RandomForest, dtype: float64\n"
|
||
]
|
||
},
|
||
{
|
||
"data": {
|
||
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAXQAAAFcCAYAAADYnEUIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8li6FKAAAgAElEQVR4nO3debxVdb3/8debI4gDasmxlEFQyTFFBdRrEuk1h1+JUldBDdOUUMzMHLDpVuZVr2V6UyM0cUgkzSFUUsvEIYcARRTURAQ5agmYA4gyfX5/rHVksznDBs45a7PW+/l4nId7rfVlnc/Zwvus/V3f9f0qIjAzs/Vfu6wLMDOzluFANzPLCQe6mVlOONDNzHLCgW5mlhMOdDOznHCgm7USSbMl/WfWdVhxONAtUw49s5bjQDdrYZI2yLoGKyYHumVG0k1Ad+BuSQslnSvpXknfKms3TdKR6euQdIakWZLmS7pUUruStidJekHSvyXdL2nbRr53j/RcJ0qam7YfLqlv+v3ekXRlSfvtJf1V0oL0+94saYuS47MlnSdpGrCoPNQl7STpVUmD0+2dJU1Mv890SUek+/eV9E9JNSV/9qj0vGZNiwh/+SuzL2A28J8l20cDT5Vs7wEsADqk2wE8BHyS5JfBP4CT02NHAjOBnYENgB8AjzfyfXuk5xoFdAS+CHwI3AVsBXQB3gI+n7bfATgY2BCoBR4BLi/7OaYC3YCNSn82YC/gNeBL6f72aZ3fAzoABwLvAzumx18BDi45923AyKz/X/mr+r98hW7V5o9AL0m90u2vAb+PiCUlbS6JiLcj4jXgcmBIuv+bwEUR8UJELAP+B+jd2FV66oKI+DAiHgAWAbdExFsR8TrwKLAnQETMjIg/R8RHETEPuAz4fNm5/i8i5kbE4pJ9BwDjgRMi4p50377ApsDFEbEkIv4K3FPyc9xS/1pSJ+DwdJ9ZkxzoVlUi4iPgVuD4tCtlCHBTWbO5Ja/nANukr7cFrki7Md4B3gZEcrXdmH+VvF7cwPamAJK2kjRO0uuS3gN+B3Ruoq56w0k+JTxUsm8bYG5ErCj7OerrHAsMkrQhMAh4OiLmNPEzmAEOdMteQ9N93gAcBxwEfBART5Qd71byujvwRvp6LvDNiNii5GujiHi8Beq8KK1194jYDDie5JdFqYZ+luFAd0m/LNn3BtCttO8//TleB4iIGSQBfxhwLEnAmzXLgW5Z+xewXemONMBXAL9g9atzgHMkfUJSN+DbwO/T/aOA8yXtCiBpc0n/1UJ1dgIWAu9I6gKcU+Gfex84FOgv6eJ031Mk3TvnSmovaQDwZWBcyZ8bC5wB9CfpQzdrlgPdsnYR8IO0m+Tskv03Ap8l6doo90dgCslNyHuB3wJExJ3AJcC4tFvkeZKr3JbwE5Kbm++m3/OOSv9gRLxDckP1MEkXpPcDjkhrmw9cDQyNiBdL/tgtwADgrxExv0V+Ass9RXiBC6s+koYCwyLic2X7A+gVETOzqcysevkK3aqOpI2B04DRWdditj5xoFtVkXQIMI+kb903A83WgLtczMxywlfoZmY54UA3M8uJzGaF69y5c/To0SOrb29mtl6aMmXK/IiobehYZoHeo0cPJk+enNW3NzNbL0lqdBoId7mYmeWEA93MLCcc6GZmOeFANzPLCQe6mVlOONDNzHKiokCXdKiklyTNlDSygeObS7pb0rPpgrcntnypZmbWlGYDPV19/CqSuZt3AYZI2qWs2QhgRkTsQTKH8y8kdWjhWs3MrAmVPFjUD5gZEbMAJI0DBgIzStoE0EmSSNZgfBtY1sK1mtka6jHy3orbzu54bMVtP9uze8VtnzvhuYrb2rqpJNC7sOrit3XAPmVtriRZ2fwNkqW6jilbANfMLFNF+OVWSR96+UK4sPpiuIeQLAe2DdAbuFLSZqudSBomabKkyfPmzVvjYs3MrHGVBHodq66y3p
WVq6zXOxG4IxIzgVeBncpPFBGjI6JPRPSprW1wbhkzM1tLlQT6JKCXpJ7pjc7BJN0rpV4DDgKQ9ClgR2BWSxZqZmZNa7YPPSKWSToduB+oAa6LiOmShqfHRwEXANdLeo6ki+Y8r1RuZta2Kpo+NyImABPK9o0qef0G8MWWLc3MzNaEnxQ1M8sJB7qZWU440M3McsKBbmaWEw50M7OccKCbmeWEA93MLCcc6GZmOeFANzPLCQe6mVlOONDNzHLCgW5mlhMVTc5l1a8Iq7GYWdN8hW5mlhMOdDOznHCgm5nlhAPdzCwnKropKulQ4AqSJeiujYiLy46fAxxXcs6dgdqIeLsFa12NbwSama3U7BW6pBrgKuAwYBdgiKRdSttExKUR0TsiegPnAw+3dpibmdmqKuly6QfMjIhZEbEEGAcMbKL9EOCWlijOzMwqV0mgdwHmlmzXpftWI2lj4FDg9kaOD5M0WdLkefPmrWmtZmbWhEoCXQ3si0bafhn4W2PdLRExOiL6RESf2traSms0M7MKVBLodUC3ku2uwBuNtB2Mu1vMzDJRSaBPAnpJ6impA0lojy9vJGlz4PPAH1u2RDMzq0SzwxYjYpmk04H7SYYtXhcR0yUNT4+PSpseBTwQEYtarVqzCng4qxVVRePQI2ICMKFs36iy7euB61uqMDMzWzN+UtTMLCcc6GZmOeFANzPLCQe6mVlOONDNzHLCgW5mlhMOdDOznHCgm5nlhAPdzCwnHOhmZjnhQDczywkHuplZTjjQzcxywoFuZpYTDnQzs5xwoJuZ5URFgS7pUEkvSZopaWQjbQZImippuqSHW7ZMMzNrTrMrFkmqAa4CDiZZMHqSpPERMaOkzRbA1cChEfGapK1aq2AzM2tYJVfo/YCZETErIpYA44CBZW2OBe6IiNcAIuKtli3TzMyaU0mgdwHmlmzXpftKfQb4hKSJkqZIGtpSBZqZWWUqWSRaDeyLBs6zN3AQsBHwhKQnI+Ifq5xIGgYMA+jevfIV1M3MrHmVXKHXAd1KtrsCbzTQ5r6IWBQR84FHgD3KTxQRoyOiT0T0qa2tXduazcysAZUE+iSgl6SekjoAg4HxZW3+CBwgaQNJGwP7AC+0bKlmZtaUZrtcImKZpNOB+4Ea4LqImC5peHp8VES8IOk+YBqwArg2Ip5vzcLNzGxVlfShExETgAll+0aVbV8KXNpypZmZ2Zrwk6JmZjnhQDczywkHuplZTjjQzcxywoFuZpYTDnQzs5xwoJuZ5YQD3cwsJxzoZmY54UA3M8sJB7qZWU440M3McsKBbmaWEw50M7OccKCbmeWEA93MLCcc6GZmOVFRoEs6VNJLkmZKGtnA8QGS3pU0Nf36UcuXamZmTWl2CTpJNcBVwMFAHTBJ0viImFHW9NGI+FIr1GhmZhWo5Aq9HzAzImZFxBJgHDCwdcsyM7M1VUmgdwHmlmzXpfvK7SfpWUl/krRri1RnZmYVa7bLBVAD+6Js+2lg24hYKOlw4C6g12onkoYBwwC6d+++hqWamVlTKrlCrwO6lWx3Bd4obRAR70XEwvT1BKC9pM7lJ4qI0RHRJyL61NbWrkPZZmZWrpJAnwT0ktRTUgdgMDC+tIGkT0tS+rpfet4FLV2smZk1rtkul4hYJul04H6gBrguIqZLGp4eHwV8FThV0jJgMTA4Isq7ZczMrBVV0ode340yoWzfqJLXVwJXtmxpZma2JvykqJlZTjjQzcxywoFuZpYTDnQzs5xwoJuZ5YQD3cwsJxzoZmY54UA3M8sJB7qZWU440M3McsKBbmaWEw50M7OccKCbmeWEA93MLCcc6GZmOeFANzPLCQe6mVlOVBTokg6V9JKkmZJGNtGur6Tlkr7aciWamVklmg10STXAVcBhwC7AEEm7NNLuEpK1R83MrI1VcoXeD5gZEbMiYgkwDhjYQLtvAbcDb7VgfWZmVqFKAr0LMLdkuy7d9zFJXYCjgFE0QdIwSZMlTZ43b9
6a1mpmZk2oJNDVwL4o274cOC8iljd1oogYHRF9IqJPbW1tpTWamVkFNqigTR3QrWS7K/BGWZs+wDhJAJ2BwyUti4i7WqRKMzNrViWBPgnoJakn8DowGDi2tEFE9Kx/Lel64B6HuZlZ22o20CNimaTTSUav1ADXRcR0ScPT4032m5uZWduo5AqdiJgATCjb12CQR8TX170sMzNbU35S1MwsJxzoZmY54UA3M8sJB7qZWU440M3McsKBbmaWEw50M7OccKCbmeWEA93MLCcc6GZmOeFANzPLCQe6mVlOONDNzHLCgW5mlhMOdDOznHCgm5nlhAPdzCwnKgp0SYdKeknSTEkjGzg+UNI0SVMlTZb0uZYv1czMmtLsEnSSaoCrgIOBOmCSpPERMaOk2YPA+IgISbsDtwI7tUbBZmbWsEqu0PsBMyNiVkQsAcYBA0sbRMTCiIh0cxMgMDOzNlVJoHcB5pZs16X7ViHpKEkvAvcCJzV0IknD0i6ZyfPmzVubes3MrBGVBLoa2LfaFXhE3BkROwFHAhc0dKKIGB0RfSKiT21t7ZpVamZmTaok0OuAbiXbXYE3GmscEY8A20vqvI61mZnZGqgk0CcBvST1lNQBGAyML20gaQdJSl/vBXQAFrR0sWZm1rhmR7lExDJJpwP3AzXAdRExXdLw9Pgo4CvAUElLgcXAMSU3Sc3MrA00G+gAETEBmFC2b1TJ60uAS1q2NDMzWxN+UtTMLCcc6GZmOeFANzPLCQe6mVlOONDNzHLCgW5mlhMOdDOznHCgm5nlhAPdzCwnHOhmZjnhQDczywkHuplZTjjQzcxywoFuZpYTDnQzs5xwoJuZ5URFgS7pUEkvSZopaWQDx4+TNC39elzSHi1fqpmZNaXZQJdUA1wFHAbsAgyRtEtZs1eBz0fE7sAFwOiWLtTMzJpWyRJ0/YCZETELQNI4YCAwo75BRDxe0v5JoGtLFmn5snTpUurq6vjwww9b5fzXHLF1xW1f0K0Vt718g4pWbEzO+8ILFbddUx07dqRr1660b9++1b6HrZ8q+RvaBZhbsl0H7NNE+28Af1qXoizf6urq6NSpEz169EBSi59/ad07FbfduV3l339Fhw6Vn7fzzhW3XRMRwYIFC6irq6Nnz56t8j1s/VVJH3pDf+OjwYbSF0gC/bxGjg+TNFnS5Hnz5lVepeXKhx9+yJZbbtkqYZ53kthyyy1b7dONrd8qCfQ6oFvJdlfgjfJGknYHrgUGRsSChk4UEaMjok9E9KmtrV2bei0nHOZrz++dNaaSQJ8E9JLUU1IHYDAwvrSBpO7AHcDXIuIfLV+mmZk1p9k+9IhYJul04H6gBrguIqZLGp4eHwX8CNgSuDq9elgWEX1ar2zLkx4j723R840/ff8WPd+aOO7w47h5ws2NHj/88MMZO3YsW2yxRRtWZUVR0W37iJgATCjbN6rk9cnAyS1bmlm2li9fTk1NzRr9mabCHGDChAlNHjdbF35S1Arp9bmvMXBAP0749o/Y/T+P5qunnMMHixfTY5//x09/OZrPHXkSt93zF16ZPZdDjxvB3ocey9AvDWXWy7MAmP/WfM444QwGDRjEoAGDeObvzwDQd9u+ALz55pv079+f3r17s9tuu/Hoo48C0KNHD+bPnw/AZZddxm677cZuu+3G5ZdfDsDs2bPZeeedOeWUU9h111354he/yOLFi9v67bH1lAPdCmv2Ky8z7PhBTPvLrWzWaROuvuE2ADpu2IHH7rqOwQMPYdi5P+NXF5zHlPvGcvZPzuZn5/4MgIu+dxF99+vLHRPv4LYHb2OHnXZY5dxjx47lkEMOYerUqTz77LP07t17leNTpkxhzJgxPPXUUzz55JNcc801PPNM8kvh5ZdfZsSIEUyfPp0tttiC22+/vQ3eDcuDyp+UMMuZT2/Thf37JkF7/KDD+b/rxgFwzBFfBGDhog94fMo0/uub5wLwocSSJUsA+Ptjf+eiqy4CoKamhk6bdV
rl3H379uWkk05i6dKlHHnkkasF+mOPPcZRRx3FJptsAsCgQYN49NFHOeKII+jZs+fH7ffee29mz57dCj+95ZED3QqrfPhf/fYmG28EwIoVK9his05M/XMS9NPX4MGi/v3788gjj3Dvvffyta99jXPOOYehQ4d+fDyiwUc5ANhwww0/fl1TU+MuF6uYu1yssN58vY4nJj8LwC1/vJ/P9V31KnqzTpvSs9s23Hb3n4EkhF98/kUA9jlgH34/5vdAcvN04fsLV/mzc+bMYauttuKUU07hG9/4Bk8//fQqx/v3789dd93FBx98wKJFi7jzzjs54IADWuXntOLwFbplbvbF/69Fzzetwkf/t+u1Izfcdg/fHHkhvXp259QTvsqvxoxbpc3NV17Iqef/Dz+74loWLl/OYUcdxk677cTIC0fyk+/+hDvG3kG7du344aU/pHfJL4SJEydy6aWX0r59ezbddFNuvPHGVc6711578fWvf51+/foBcPLJJ7Pnnnu6e8XWiQPdCksSoy75/ir7Zj+16pj4nt27cN/NVwGrdrl03qozv7rpV6udc9KcSQCccMIJnHDCCasdLw3ss846i7POOmuV4z169OD555//ePvss8+u8Kcxc5eLmVluONCtkLp0684dDz6RdRlmLcqBbmaWEw50M7OccKCbmeWEA93MLCc8bNGy9+PNW/Z8J89p2fNV6PXXXmfEcSO469G7mDhxIj//+c+55557MqnFislX6FZ4EcGKFSuyLsNsnfkK3Qrp9bmvMWLof3Hof+zBE1OmcebJxzLqpj/w0ZKlbL9tV8b88sdsusnGTJo6nW//6FIWfbCYFR035Ld3/JZ33n6H8087n8UfJHOsfO/i77Fnvz0z/onMHOhWYLNfeZmhl32Pn54znEEnn81ffj+KTTbeiEuuup7LRv+OkSNO5JhTR/L7X19M39678tRHS9iw44Z8svMnueYP17Bhxw2Z88oczvnmOdz6l1uz/nHMKgt0SYcCV5AsQXdtRFxcdnwnYAywF/D9iPh5Sxdq1tK27tqNfffenXv+/Agz/vEq+w88EYAlS5ey396789Irs9l6q8707b0rAJt22hSAxR8s5sKRF/LS8y/Rrl075szKps/erFyzgS6pBrgKOBioAyZJGh8RM0qavQ2cARzZKlWatYKNNtoYSPrQD+6/D7dcfdEqx6fN+MdqU+wC3DjqRras3ZLbJ97OihUr2Lvr3m1Sr1lzKrkp2g+YGRGzImIJMA4YWNogIt6KiEnA0lao0axV7bv37vxt0rPMfPU1AD5YvJh/vDKHnXboyRv/msekqdMBWLRwEcuWLWPhewup/VQt7dq14+5b72b58uVZlm/2sUq6XLoAc0u264B91uabSRoGDAPo3r372pzC8ujH77bs+SqcPrde7Zaf4Ppf/pghI77HR+mKRD87dwSf2X5bfv/ri/nWDy5h8YcfwcYbce0frmXwiYM586QzeWD8A/Tdvy8bpQtimGWtkkBf/TMnNL7cShMiYjQwGqBPnz5rdQ6zlrBycq5XATjwc/2YNOF3q7Xr23tXnrwnmcu8fvrcbTfdljsfvvPjNt/54XeSc3bvwl2P3gXAgAEDGDBgQCv+BGarq6TLpQ7oVrLdFXijdcoxM7O1VUmgTwJ6SeopqQMwGBjfumWZmdmaarbLJSKWSToduJ9k2OJ1ETFd0vD0+ChJnwYmA5sBKySdCewSEe+1Yu1mZlaionHoETEBmFC2b1TJ63+SdMWYmVlGPJeLmVlOONDNzHLCc7lY5j57w2db9Hw3H/Ro822u+w233XQde36mK2/8cx5PP/8iF543grOHD23RWszakgPdCunWG3/LVTfeRp9N5zOn7k3uuu+hrEsyW2fucrHCueD871D32my+fdIQbr5jAn1770r79r62sfWf/xZb4fzwol/y+MQHufbWu/l8Z4+stfzwFbqZWU440M3McsKBbmaWE+5Dt8w9d8JzLXq+aWswfe4/35
pPn8OO572Fi2jXTlx+zVhmTPwDm6WrE5mtTxzoVkh/emIaAJ9u9x51U+7LuBqzluEuFzOznHCgm5nlhAPdMhHhBavWlt87a4wD3dpcx44dWbBggYNpLUQECxYsoGPHjlmXYlXIN0WtzXXt2pW6ujrmzZvXKuf/178XV9z2BVVewz83qPyfS7t5rXet1LFjR7p29fIDtjoHurW59u3b07Nnz1Y7/2Ej76247eyOx1bc9uie3Stu29JDMc0qUdFlhKRDJb0kaaakkQ0cl6T/S49Pk7RXy5dqZmZNaTbQJdUAVwGHAbsAQyTtUtbsMKBX+jUM+HUL12lmZs2o5Aq9HzAzImZFxBJgHDCwrM1A4MZIPAlsIWnrFq7VzMyaUEkfehdgbsl2HbBPBW26AG+WNpI0jOQKHmChpJfWqNp1oMYPdQbmr7rr+crP+/Umzlyl/F6s5PdiJb8XK1X5e7FtYwcqCfSGKigfb1ZJGyJiNDC6gu/ZZiRNjog+WddRDfxerOT3YiW/FytV+3tRSZdLHdCtZLsr8MZatDEzs1ZUSaBPAnpJ6impAzAYGF/WZjwwNB3tsi/wbkS8WX4iMzNrPc12uUTEMkmnA/cDNcB1ETFd0vD0+ChgAnA4MBP4ADix9UpucVXVBZQxvxcr+b1Yye/FSlX9XsiPX5uZ5YPncjEzywkHuplZTjjQzcxywoFuZtYESftXsq8aFPKmqKTPAOeQPHH18UifiDgws6LakKRpjR0CIiJ2b8t6siSpI3AM8G/gbuBc4ADgFeCCiJjfxB/PJUkbA98FukfEKZJ6ATtGxD0Zl5YJSU9HxF7N7asGRZ0+9zZgFHANsDzjWrKwguRJ3rEkIVb5BOL5cyOwFNiEJMSeB64EPgdcD3wps8qyMwaYAuyXbteR/JspVKBL2g/4D6BW0lklhzYjGcJddYoa6MsiorAzQkZEb0k7AUNIQn1G+t8HImJZpsW1vV0iYjdJGwB1EfH5dP99kp7NsrAMbR8Rx0gaAhARiyWtfxOyrLsOwKYkOdmpZP97wFczqagZRQ30uyWdBtwJfFS/MyLezq6kthURLwL/Dfy3pGNIrlQvAS7NtLC2twQ+foCufLqKIn56A1giaSPS+ZgkbU/Jv5OiiIiHgYclXR8RcwAktQM2jYj3sq2uYUXtQ3+1gd0REdu1eTEZkdSFZBqHo0j6j28F7oyIhZkW1sYkvUUyJbRI+tLH1R8Cjo6IT2VVW1YkHQz8gGT9gweA/YGvR8TELOvKiqSxwHCSX/BTgM2ByyKi6i5+ChnoRSfpYZKPkLcCfwBW+WRSpE8qkk5o6nhE3NBWtVQTSVsC+5L8YnuyiDeH60mamnZTHgfsDZwHTKnGwQOFDHRJ7YFTgf7pronAbyJiaWZFtSFJs1k5vXHpX4D6US6F+aRiq0v7y48DtouIn0rqDnw6Iv6ecWmZkDQd6E1yn+nKiHhY0rMRsUfGpa2mqH3ovwbaA1en219L952cWUVtKCJ6ZF1DtZA0hgbm7k9FRHyjLeupEleTjIQ6EPgp8D5wO9A3y6Iy9BtgNvAs8IikbUlujFadol6hr/bbtVp/47YGSTOA3wHjImJW1vVkSdJXGtjdHTgTqImIrm1cUubqx1hLeiYi9kz3FebfRyUkbVCNI8KK+qTo8vTOPQCStqNYIxqGkPSh/1nSU5LOlLRN1kVlISJur/8CniFZ8PxU4GKgqF1PS9PF4etHudSSXLEXkqRPSfqtpD+l27sATd57yUpRr9APInl4YhZJv/G2wIkR8VCmhWUgXZDkGOArJPPZ3xIR12RbVduStDPwfWBPkmGbv6vGq6+2kt78OwbYC7iBZMz1DyLitkwLy0ga5GOA70fEHukzC89ExGczLm01hQx0AEkbAjuSBPqLEVG4cbalJA0AfknyoM2GGZfTZiTdBvQBfk4y6meVT2pFGvFTKn3w7CCSfx8PRsQLGZeUGUmTIqJvWRfU1IjonXVt5Qp1U1TSgRHxV0
mDyg5tL4mIuCOTwjIiqS9J98tXSG76jCZ5xLtI+pJ0LZxN8uh/6RORQcG6XdIHZ6ZFxG7Ai1nXUyUWpcM467ug9gXezbakhhUq0IHPA38FvtzAsQAKEeiS/gc4GniH5EGa/SOiLtuqsuERP6uKiBWSnpXUPSJey7qeKnEWybrJ20v6G1BLlT76X9gulyKTNAG4OCIeSbeHklylzwF+XOBuhi6sPgPnI9lVlA1JfyX55PJ3YFH9/og4IrOiMpJ+YtmX5L2o76J9qVqfWSnaFToAkr5NcpPjfZIZF/cCRkbEA5kW1nY+TTKrIJL6k4zo+BbJwxOjqdKrj9Yk6RKSG4EzWNmPHkDhAp1kQqrSWSZFMs9P4aSfWH4REfsB07OupzmFDHTgpIi4QtIhwFbAiSQBX5RAb1dyFX4MMDodtne7pKkZ1pWlI0nm/C70zfHUBunEVB9LJ+sqqgfS5xXuiCrv0ihqoNff+DocGBMRzxZsetANSh6MOAgYVnoso5qyNovk6eHCBrqkU4HTgO3KFkHpBPwtm6qqwlkk8+Uvl7SYlVNkbJZtWasr6j/eKZIeAHoC50vqRLEenLiFZFrQ+SSLWzwKIGkHqvTufRv4AJgq6UFWnVL5jOxKanNjgT8BFwEjS/a/X9T7KgAR0an5VtWhkDdF0xsdvYFZEfGOpE8CXSOisaXZcicderU1yaIWi9J9nyGZ6/npTIvLQGOzLhZ1tkVblaQjKJnMr1qX4ytqoO8PTI2IRZKOJ7kpekX9JPZmZvUkXUwy6ufmdNcQkulzRzb+p7JR1ECfBuwB7A7cBPwWGFSy/JgVTLoQ8kUkizp0rN/vqYQtzYveEbEi3a4hefS/6uZDL+rkXMvSu9UDSa7Mr2DVNQOteMaQTKG8DPgCyZJ8N2VakVWTLUpeb55ZFc0o6k3R9yWdTzIP+gHpb9z2Gddk2dooIh6UpLTr7ceSHiVZd9WK7SLgGUkPkYxw6Q+cn21JDStqoB8DHEsyHv2f6YosVbc+oLWpD9Ob5S9LOh14neQZBSu4iLhF0kSSfnQB50XEP7OtqmGF7EMHSFcd6RURf5G0McliBu9nXZdlI52o7AWSj9YXkHys/t+IeDLTwiwzkk6PiCvT17tGRO3Q8RIAAAkUSURBVNU/KVrIQJd0CsnDNJ+MiO3TG2KjIuKgjEszsypRv3JT+etqVtQulxFAP+ApgIh4WZI/XheQpMsj4kxJd9PA2qJFnJDKGrRePEle1ED/KCKW1D/tn65AUryPKgYrR7L8PNMqrBptIekoktGAm5Wvo1CN6ycUtcvlf0nmAh9KMsvgacCMiPh+poVZVZD0CaBbkZ4cttVJGtPE4YiIk9qsmAoVNdDbAd8AvkjyUep+4Npqn0nNWk86iuEIkk+tU4F5wMMRcVaWdZmticIFejrm/IaIOD7rWqx61K8XKelkkqvz/5Y0rRqfBrS2JWkLkk/zPVh18ZOqm7itcH3oEbFcUq2kDhGxJOt6rGpsIGlrkqX53PVmpSYATwLPUeWzshYu0FOzgb9JGs+qS2xdlllFlrWfknS9PRYRkyRtB7yccU1WHTquL11vhetyAZDU4OPcEfGTtq7FzKqbpO8AC4F7WHWu/KqbI76QgW5WLh359DOSBT/uI5mN88yI+F2mhVnmJI0ALiQZGVcfmFGNM3EWMtAbeYjkXWAy8JuI+LDtq7IsSZoaEb3TccdHAt8BHoqIPTIuzTIm6RVgn4iYn3UtzSnq9LmzSD5CXZN+vQf8C/hMum3FUz/b5uHALdX4cdoyM51kicKqV9SbontGRP+S7bslPRIR/SVV/QQ81irulvQiSZfLaZJqAX9SM4DlJOvNPkSVrzdb1ECvldQ9Il4DSKfP7Zwe81DGAoqIkZIuAd5Lh7YuIlkAxeyu9KvqFTXQvws8lvaNCehJclW2CeBFgQtI0tCS16WHbmz7aqyaRMQNkjqQdMkCvBQRS7OsqTGFvCkKIGlDYCeSQH/RN0KLTd
KvSjY7AgcBT0fEVzMqyaqEpAEkF3qzSfKiG3BCRDySYVkNKmSgpwtanAVsGxGnpPOh7xgR92RcmlUJSZsDN3n6XJM0BTg2Il5Ktz9DcuN872wrW11RR7mMIekr3y/driMZg2xW7wOgV9ZFWFVoXx/mABHxD6p0DeKi9qFvHxHHSBoCEBGLVdZxasVS9mxCO2AX4NbsKrIqMlnSb1k5d/5xwJQM62lUUQN9iaSNSP8BS9qekuFIVkilC1wsA+ZERF1WxVhVOZVklbMzSPrQHwGuzrSiRhS1D/1g4AckV2EPAPsDX4+IiVnWZWa2LgoZ6ACStgT2JfmN++T68FivtR5J+wK/AnYGOgA1wKKI2CzTwiwzkp6jiaUpq3Gu/KJ2uRARC4B7ASTtKOmiiDgl47IsO1cCg4HbgD4kCxrskGlFlrUvpf8dkf63tA+9KqcCKNQoF0m7S3pA0vOSfibpU5JuBx4EZmRdn2UrImYCNRGxPCLGAF/IuibLTkTMiYg5wP4RcW5EPJd+jQQOybq+hhQq0Ekm3hoLfIVkzcinSSbq2iEifpllYZa5D9KnAZ+V9L/pHNibZF2UVYVNJH2ufkPSf1ClfzcK1YdeP0VqyfZcoEdELM+wLKsCkrYlmXGzA8nUuZsBv06v2q3AJO0NXAdsnu56BzgpIp7OrqqGFa0PvaOkPUluhEIyhe7u9WPQq/F/kLUuSQOBrhFxVbr9MLAVyc2wJwAHesFFxBRgD0mbkVwEv5t1TY0p2hX6Q00cjog4sM2Ksaog6W/A4IiYm25PBQ4ENgXGRMRBWdZn2UvnffoK0IOSi+CI+GlWNTWmUFfoEeGbXFauQ32Ypx5LF7d4O5190+yPJCuaTaHKH0As1BV6vXSNwJsj4p10+xPAkIioyqe/rPVImhkRDQ5PlPRKRGzf1jVZdZH0fETslnUdlSjaKJd6p9SHOUBE/BvwGPRiekrSav/vJX0T+HsG9Vj1eVzSZ7MuohJFvUKfBuwR6Q8vqQaYFhG7ZluZtTVJW5GsRvMRyTBWgL2BDYEjI+JfWdVm1UHSDJKHzF4l+XsikntuVfekaFED/VKSGxyjSEYzDAfmRsR3s6zLsiPpQKD+F/r0iPhrlvVY9UiHtK4mfeioqhQ10NsB3yRZlUYkE3Rd6/HoZtaY9NNcx/rt+jWJq0khA93MrFKSjgB+AWwDvAVsC7xQjV20hRq2KOnWiDi6sVnUqrFPzMwydwHJzKx/iYg9JX0BGJJxTQ0qVKAD307/+6UmW5mZrbQ0IhZIaiepXUQ8JOmSrItqSKGGLUbEm+nL0+pnUiuZUe20LGszs6r1jqRNSVYqulnSFSSrWlWdQvahS3o6IvYq2zfNXS5mVi59YngxyQXwcSSTdN2crqlQVQoV6JJOJbkS355VJ13qBPwtIo7PpDAzW2+kz60Mjoibs66lXNECfXPgE8BFwMiSQ++n83eYmQGQzq44AugCjAf+nG6fA0yNiIEZltegQgV6PUnbA3UR8ZGkAcDuwI2l0wGYWbFJ+iPwb5JplA8iuRjsAHw7IqZmWVtjihroU0nWjewB3E/y23fHiDg8y7rMrHpIei4iPpu+rgHmA90j4v1sK2tcoUa5lFgREcuAQcDlEfEdYOuMazKz6rK0/kX6FPmr1RzmULxx6PWWShpCsrL7l9N97TOsx8yqzx6S3ktfC9go3a6fnGuz7EprWFED/USSCbkujIhXJfUEfpdxTWZWRSKiJusa1lQh+9DNzPKoUFfonsvFzPKsUFfokraOiDfXp/mNzcwqVahANzPLs0J1udST9D6rd7m8C0wGvhsRs9q+KjOzdVPIQAcuA94AxpIMQRoMfBp4CbgOGJBZZWZma6mQXS6SnoqIfcr2PRkR+0p6NiL2yKo2M7O1VdgnRSUdXT9hvaSjS44V7zecmeVCUa/QtwOuAPZLdz0BfAd4Hdg7Ih7LqjYzs7VVyEA3M8ujQna5SOoq6U5Jb0n6l6TbJXXNui4zs3
VRyEAHxpBMmbsNyeT1d6f7zMzWW4XscpE0NSJ6N7fPzGx9UtQr9PmSjpdUk34dD1Tdgq9mZmuiqFfo3YErSUa5BPA4cEZEvJZpYWZm66CQgd4QSWdGxOVZ12FmtrYc6ClJr0VE96zrMDNbW0XtQ2+Isi7AzGxdONBX8kcVM1uvFWq2xUamzYV0Adg2LsfMrEW5D93MLCfc5WJmlhMOdDOznHCgm5nlhAPdzCwnHOhmZjnx/wEl5RQS+jjrtwAAAABJRU5ErkJggg==\n",
|
||
"text/plain": [
|
||
"<Figure size 432x288 with 1 Axes>"
|
||
]
|
||
},
|
||
"metadata": {
|
||
"needs_background": "light"
|
||
},
|
||
"output_type": "display_data"
|
||
}
|
||
],
|
||
"source": [
|
||
"# type markov: fit five classifiers on feature columns 0-4 and compare their scores.\n",
|
||
"N_FEATURES = 5\n",
|
||
"SEED = 0  # fixed so the tree, forest and liblinear results repeat on every run\n",
|
||
"# NOTE: the three printed scores are identical under average='micro';\n",
|
||
"# switch to 'macro' if per-class differences should show up in the chart.\n",
|
||
"AVERAGE = 'micro'\n",
|
||
"\n",
|
||
"x_train = train_df.iloc[:, :N_FEATURES].values.copy()\n",
|
||
"y_train = train_df['label'].values.copy()\n",
|
||
"x_test = test_df.iloc[:, :N_FEATURES].values.copy()\n",
|
||
"y_test = test_df['label'].values.copy()\n",
|
||
"\n",
|
||
"# Pin the values the FutureWarnings say are about to change, so a scikit-learn\n",
|
||
"# upgrade cannot silently alter the results (and the warnings go away).\n",
|
||
"lr_classifer = LogisticRegression(solver='liblinear', multi_class='ovr', random_state=SEED)\n",
|
||
"svm_classifer = SVC(gamma='auto')\n",
|
||
"gn_classifer = GaussianNB()\n",
|
||
"tr_classifer = tree.DecisionTreeClassifier(random_state=SEED)\n",
|
||
"rf_classifer = RandomForestClassifier(n_estimators=10, random_state=SEED)\n",
|
||
"classifiers = {\n",
|
||
"    'LogisticRegression': lr_classifer,\n",
|
||
"    'SVM': svm_classifer,\n",
|
||
"    'GaussianNB': gn_classifer,\n",
|
||
"    'tree': tr_classifer,\n",
|
||
"    'RandomForest': rf_classifer,\n",
|
||
"}\n",
|
||
"\n",
|
||
"# One fit/predict/score pass per model instead of five copy-pasted stanzas.\n",
|
||
"score_rows = []\n",
|
||
"for classifier in classifiers.values():\n",
|
||
"    classifier.fit(x_train, y_train)\n",
|
||
"    y_pred = classifier.predict(x_test)\n",
|
||
"    score_rows.append([\n",
|
||
"        precision_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"        recall_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"        f1_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"    ])\n",
|
||
"score_df = pd.DataFrame(score_rows, index=list(classifiers), columns=['precision', 'recall', 'f1'])\n",
|
||
"\n",
|
||
"ax = score_df.plot.bar(title='type markov')\n",
|
||
"fig = ax.get_figure()\n",
|
||
"fig.savefig('../figure/type.svg')\n",
|
||
"print(score_df.loc['RandomForest'])"
|
||
]
|
||
},
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": 15,
|
||
"metadata": {},
|
||
"outputs": [
|
||
{
|
||
"name": "stderr",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:430: FutureWarning: Default solver will be changed to 'lbfgs' in 0.22. Specify a solver to silence this warning.\n",
|
||
" warnings.warn(\"Default solver will be changed to 'lbfgs' in 0.22. \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:467: FutureWarning: Default multi_class will be changed to 'auto' in 0.22. Specify the multi_class option to silence this warning.\n",
|
||
" warnings.warn(\"Default multi_class will be changed to 'auto' in\"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\svm\\base.py:189: FutureWarning: The default value of gamma will change from 'auto' to 'scale' in version 0.22 to account better for unscaled features. Set gamma explicitly to 'auto' or 'scale' to avoid this warning.\n",
|
||
" warnings.warn(\"The default value of gamma will change \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\ensemble\\forest.py:244: FutureWarning: The default value of n_estimators will change from 10 in version 0.20 to 100 in 0.22.\n",
|
||
" warn(\"The default value of n_estimators will change from \"\n"
|
||
]
|
||
},
|
||
{
|
||
"name": "stdout",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"precision 0.993148\n",
|
||
"recall 0.993148\n",
|
||
"f1 0.993148\n",
|
||
"Name: RandomForest, dtype: float64\n"
|
||
]
|
||
},
|
||
{
|
||
"data": {
|
||
"image/png": "\n",
|
||
"text/plain": [
|
||
"<Figure size 432x288 with 1 Axes>"
|
||
]
|
||
},
|
||
"metadata": {
|
||
"needs_background": "light"
|
||
},
|
||
"output_type": "display_data"
|
||
}
|
||
],
|
||
"source": [
|
||
"# type+length markov: fit five classifiers on feature columns 0-9 and compare their scores.\n",
|
||
"N_FEATURES = 10\n",
|
||
"SEED = 0  # fixed so the tree, forest and liblinear results repeat on every run\n",
|
||
"# NOTE: the three printed scores are identical under average='micro';\n",
|
||
"# switch to 'macro' if per-class differences should show up in the chart.\n",
|
||
"AVERAGE = 'micro'\n",
|
||
"\n",
|
||
"x_train = train_df.iloc[:, :N_FEATURES].values.copy()\n",
|
||
"y_train = train_df['label'].values.copy()\n",
|
||
"x_test = test_df.iloc[:, :N_FEATURES].values.copy()\n",
|
||
"y_test = test_df['label'].values.copy()\n",
|
||
"\n",
|
||
"# Pin the values the FutureWarnings say are about to change, so a scikit-learn\n",
|
||
"# upgrade cannot silently alter the results (and the warnings go away).\n",
|
||
"lr_classifer = LogisticRegression(solver='liblinear', multi_class='ovr', random_state=SEED)\n",
|
||
"svm_classifer = SVC(gamma='auto')\n",
|
||
"gn_classifer = GaussianNB()\n",
|
||
"tr_classifer = tree.DecisionTreeClassifier(random_state=SEED)\n",
|
||
"rf_classifer = RandomForestClassifier(n_estimators=10, random_state=SEED)\n",
|
||
"classifiers = {\n",
|
||
"    'LogisticRegression': lr_classifer,\n",
|
||
"    'SVM': svm_classifer,\n",
|
||
"    'GaussianNB': gn_classifer,\n",
|
||
"    'tree': tr_classifer,\n",
|
||
"    'RandomForest': rf_classifer,\n",
|
||
"}\n",
|
||
"\n",
|
||
"# One fit/predict/score pass per model instead of five copy-pasted stanzas.\n",
|
||
"score_rows = []\n",
|
||
"for classifier in classifiers.values():\n",
|
||
"    classifier.fit(x_train, y_train)\n",
|
||
"    y_pred = classifier.predict(x_test)\n",
|
||
"    score_rows.append([\n",
|
||
"        precision_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"        recall_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"        f1_score(y_test, y_pred, average=AVERAGE),\n",
|
||
"    ])\n",
|
||
"score_df = pd.DataFrame(score_rows, index=list(classifiers), columns=['precision', 'recall', 'f1'])\n",
|
||
"\n",
|
||
"ax = score_df.plot.bar(title='type+length markov')\n",
|
||
"fig = ax.get_figure()\n",
|
||
"fig.savefig('../figure/type_length.svg')\n",
|
||
"print(score_df.loc['RandomForest'])"
|
||
]
|
||
},
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": 17,
|
||
"metadata": {},
|
||
"outputs": [
|
||
{
|
||
"name": "stderr",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:430: FutureWarning: Default solver will be changed to 'lbfgs' in 0.22. Specify a solver to silence this warning.\n",
|
||
" warnings.warn(\"Default solver will be changed to 'lbfgs' in 0.22. \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\linear_model\\logistic.py:467: FutureWarning: Default multi_class will be changed to 'auto' in 0.22. Specify the multi_class option to silence this warning.\n",
|
||
" warnings.warn(\"Default multi_class will be changed to 'auto' in\"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\svm\\base.py:189: FutureWarning: The default value of gamma will change from 'auto' to 'scale' in version 0.22 to account better for unscaled features. Set gamma explicitly to 'auto' or 'scale' to avoid this warning.\n",
|
||
" warnings.warn(\"The default value of gamma will change \"\n",
|
||
"c:\\python38\\lib\\site-packages\\sklearn\\ensemble\\forest.py:244: FutureWarning: The default value of n_estimators will change from 10 in version 0.20 to 100 in 0.22.\n",
|
||
" warn(\"The default value of n_estimators will change from \"\n"
|
||
]
|
||
},
|
||
{
|
||
"name": "stdout",
|
||
"output_type": "stream",
|
||
"text": [
|
||
"precision 0.99743\n",
|
||
"recall 0.99743\n",
|
||
"f1 0.99743\n",
|
||
"Name: RandomForest, dtype: float64\n"
|
||
]
|
||
},
|
||
{
|
||
"data": {
|
||
"image/png": "\n",
|
||
"text/plain": [
|
||
"<Figure size 432x288 with 1 Axes>"
|
||
]
|
||
},
|
||
"metadata": {
|
||
"needs_background": "light"
|
||
},
|
||
"output_type": "display_data"
|
||
}
|
||
],
|
||
"source": [
|
||
"# type+length+burst markov\n",
"# Compare five classifiers on the first 15 feature columns; the target is the 'label' column.\n",
"x_train = train_df.iloc[:, 0:15].values.copy()\n",
"y_train = train_df['label'].values.copy()\n",
"x_test = test_df.iloc[:, 0:15].values.copy()\n",
"y_test = test_df['label'].values.copy()\n",
"\n",
"# Fixed seed for the randomised estimators so Restart & Run All reproduces the scores.\n",
"seed = 0\n",
"\n",
"# (row label in score_df, unfitted estimator); the list order is the bar order in the plot.\n",
"classifiers = [\n",
"    ('LogisticRegression', LogisticRegression(random_state=seed)),\n",
"    ('SVM', SVC()),\n",
"    ('GaussianNB', GaussianNB()),\n",
"    ('tree', tree.DecisionTreeClassifier(random_state=seed)),\n",
"    ('RandomForest', RandomForestClassifier(random_state=seed)),\n",
"]\n",
"\n",
"score_df = pd.DataFrame(np.zeros((len(classifiers), 3)),\n",
"                        index=[name for name, _ in classifiers],\n",
"                        columns=['precision', 'recall', 'f1'])\n",
"\n",
"# Fit each model once on the training split and score it on the test split.\n",
"# All three metrics are micro-averaged, exactly as in the per-model code this loop replaces.\n",
"for name, classifier in classifiers:\n",
"    classifier.fit(x_train, y_train)\n",
"    y_pred = classifier.predict(x_test)\n",
"    score_df.loc[name] = [\n",
"        precision_score(y_test, y_pred, average='micro'),\n",
"        recall_score(y_test, y_pred, average='micro'),\n",
"        f1_score(y_test, y_pred, average='micro'),\n",
"    ]\n",
"\n",
"# Save the comparison chart and print the RandomForest row.\n",
"ax = score_df.plot.bar(title='type+length+burst markov')\n",
"fig = ax.get_figure()\n",
"fig.savefig('../figure/type_length_burst.svg')\n",
"print(score_df.loc['RandomForest'])"
|
||
]
|
||
},
|
||
{
|
||
"cell_type": "code",
|
||
"execution_count": null,
|
||
"metadata": {
|
||
"collapsed": true
|
||
},
|
||
"outputs": [],
|
||
"source": []
|
||
}
|
||
],
|
||
"metadata": {
|
||
"kernelspec": {
|
||
"display_name": "Python 3",
|
||
"language": "python",
|
||
"name": "python3"
|
||
},
|
||
"language_info": {
|
||
"codemirror_mode": {
|
||
"name": "ipython",
|
||
"version": 3
|
||
},
|
||
"file_extension": ".py",
|
||
"mimetype": "text/x-python",
|
||
"name": "python",
|
||
"nbconvert_exporter": "python",
|
||
"pygments_lexer": "ipython3",
|
||
"version": "3.6.2"
|
||
}
|
||
},
|
||
"nbformat": 4,
|
||
"nbformat_minor": 2
|
||
}
|