Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
2
2021-180 Smart Assistant to ease the process of COVID-19 and Pneumonia disease detection
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
2021-180
2021-180 Smart Assistant to ease the process of COVID-19 and Pneumonia disease detection
Commits
f0a18db2
Commit
f0a18db2
authored
Jul 04, 2021
by
Dias M.H.V IT18121698
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Upload breathing model
parent
32106ed2
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
1769 additions
and
0 deletions
+1769
-0
breathing01.ipynb
breathing01.ipynb
+1769
-0
No files found.
breathing01.ipynb
0 → 100644
View file @
f0a18db2
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "c625fa1f",
"metadata": {},
"outputs": [],
"source": [
"import numpy as np"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "fe4eccb6",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "2be1196b",
"metadata": {},
"outputs": [],
"source": [
"import matplotlib.pyplot as plt"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "61ab0aa3",
"metadata": {},
"outputs": [],
"source": [
"import sklearn.metrics as sm"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "710e86ff",
"metadata": {},
"outputs": [],
"source": [
"%matplotlib inline"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "66119972",
"metadata": {},
"outputs": [],
"source": [
"breathing_dataset = pd.read_csv('breathing.csv')"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "ac6f6630",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Age</th>\n",
" <th>Gender</th>\n",
" <th>Positivity</th>\n",
" <th>Time</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>24</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>16.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>27</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>71.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>21.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>25</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>55.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>28</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>35.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>150</th>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>43.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>151</th>\n",
" <td>23</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>45.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>45.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>153</th>\n",
" <td>48</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>14.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>49</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>16.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>155 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" Age Gender Positivity Time\n",
"0 24 1 0 16.0\n",
"1 27 0 0 71.0\n",
"2 19 0 1 21.0\n",
"3 25 1 0 55.0\n",
"4 28 0 1 35.0\n",
".. ... ... ... ...\n",
"150 19 0 1 43.0\n",
"151 23 1 1 45.0\n",
"152 12 0 1 45.0\n",
"153 48 1 1 14.0\n",
"154 49 0 1 16.0\n",
"\n",
"[155 rows x 4 columns]"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"breathing_dataset"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "0d04edae",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Age</th>\n",
" <th>Gender</th>\n",
" <th>Positivity</th>\n",
" <th>Time</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>155.000000</td>\n",
" <td>155.000000</td>\n",
" <td>155.000000</td>\n",
" <td>155.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>mean</th>\n",
" <td>31.832258</td>\n",
" <td>0.483871</td>\n",
" <td>0.651613</td>\n",
" <td>30.450258</td>\n",
" </tr>\n",
" <tr>\n",
" <th>std</th>\n",
" <td>12.995913</td>\n",
" <td>0.501360</td>\n",
" <td>0.478004</td>\n",
" <td>20.612098</td>\n",
" </tr>\n",
" <tr>\n",
" <th>min</th>\n",
" <td>10.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25%</th>\n",
" <td>22.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>17.295000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50%</th>\n",
" <td>27.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1.000000</td>\n",
" <td>25.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75%</th>\n",
" <td>40.000000</td>\n",
" <td>1.000000</td>\n",
" <td>1.000000</td>\n",
" <td>38.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>max</th>\n",
" <td>79.000000</td>\n",
" <td>1.000000</td>\n",
" <td>1.000000</td>\n",
" <td>180.000000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Age Gender Positivity Time\n",
"count 155.000000 155.000000 155.000000 155.000000\n",
"mean 31.832258 0.483871 0.651613 30.450258\n",
"std 12.995913 0.501360 0.478004 20.612098\n",
"min 10.000000 0.000000 0.000000 2.000000\n",
"25% 22.000000 0.000000 0.000000 17.295000\n",
"50% 27.000000 0.000000 1.000000 25.000000\n",
"75% 40.000000 1.000000 1.000000 38.000000\n",
"max 79.000000 1.000000 1.000000 180.000000"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"breathing_dataset.describe()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "e634ed26",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"sum(breathing_dataset.isnull().sum())"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "1cd86953",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Age 0\n",
"Gender 0\n",
"Positivity 0\n",
" Time 0\n",
"dtype: int64\n"
]
}
],
"source": [
"print(breathing_dataset.isnull().sum())"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "074b7f92",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.preprocessing import LabelEncoder"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "f2131141",
"metadata": {},
"outputs": [],
"source": [
"dataTransform = breathing_dataset.copy()"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "e9256db9",
"metadata": {},
"outputs": [],
"source": [
"labelencoder = LabelEncoder()"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "1fa32cda",
"metadata": {},
"outputs": [],
"source": [
"for data in breathing_dataset.columns:\n",
" dataTransform[data] = labelencoder.fit_transform(breathing_dataset[data])"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "c58c4992",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Age</th>\n",
" <th>Gender</th>\n",
" <th>Positivity</th>\n",
" <th>Time</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>10</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>13</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>49</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>14</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>11</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>42</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>14</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>26</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>150</th>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>34</td>\n",
" </tr>\n",
" <tr>\n",
" <th>151</th>\n",
" <td>9</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>35</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>35</td>\n",
" </tr>\n",
" <tr>\n",
" <th>153</th>\n",
" <td>33</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>34</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>8</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>155 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" Age Gender Positivity Time\n",
"0 10 1 0 8\n",
"1 13 0 0 49\n",
"2 5 0 1 14\n",
"3 11 1 0 42\n",
"4 14 0 1 26\n",
".. ... ... ... ...\n",
"150 5 0 1 34\n",
"151 9 1 1 35\n",
"152 1 0 1 35\n",
"153 33 1 1 6\n",
"154 34 0 1 8\n",
"\n",
"[155 rows x 4 columns]"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dataTransform"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "9a8e65fe",
"metadata": {},
"outputs": [],
"source": [
"Y = dataTransform['Positivity']"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "496ec58e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0 0\n",
"1 0\n",
"2 1\n",
"3 0\n",
"4 1\n",
" ..\n",
"150 1\n",
"151 1\n",
"152 1\n",
"153 1\n",
"154 1\n",
"Name: Positivity, Length: 155, dtype: int64"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Y"
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "fade6c35",
"metadata": {},
"outputs": [],
"source": [
"X = dataTransform.drop(['Positivity'], axis = 1)"
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "2687c8b6",
"metadata": {},
"outputs": [],
"source": [
"breathing_feature_list = list(X.columns)"
]
},
{
"cell_type": "code",
"execution_count": 20,
"id": "df9b7ed2",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"['Age', 'Gender', ' Time']"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"breathing_feature_list"
]
},
{
"cell_type": "code",
"execution_count": 21,
"id": "4ea9146d",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.model_selection import train_test_split"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "ef17efb6",
"metadata": {},
"outputs": [],
"source": [
"X_train,X_test,Y_train,Y_test = train_test_split(X,Y,test_size = 0.2, random_state = 41)"
]
},
{
"cell_type": "code",
"execution_count": 23,
"id": "acabe819",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Age</th>\n",
" <th>Gender</th>\n",
" <th>Time</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>20</th>\n",
" <td>16</td>\n",
" <td>1</td>\n",
" <td>23</td>\n",
" </tr>\n",
" <tr>\n",
" <th>51</th>\n",
" <td>33</td>\n",
" <td>1</td>\n",
" <td>9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>62</th>\n",
" <td>17</td>\n",
" <td>1</td>\n",
" <td>20</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>46</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>14</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>15</td>\n",
" <td>0</td>\n",
" <td>37</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>42</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>65</th>\n",
" <td>33</td>\n",
" <td>1</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>14</td>\n",
" <td>1</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>34</td>\n",
" <td>1</td>\n",
" <td>9</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>124 rows × 3 columns</p>\n",
"</div>"
],
"text/plain": [
" Age Gender Time\n",
"20 16 1 23\n",
"51 33 1 9\n",
"62 17 1 20\n",
"127 2 0 46\n",
"2 5 0 14\n",
".. ... ... ...\n",
"26 15 0 37\n",
"89 42 0 2\n",
"65 33 1 8\n",
"80 14 1 8\n",
"140 34 1 9\n",
"\n",
"[124 rows x 3 columns]"
]
},
"execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"X_train"
]
},
{
"cell_type": "code",
"execution_count": 24,
"id": "3979a00d",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Age</th>\n",
" <th>Gender</th>\n",
" <th>Time</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" <td>29</td>\n",
" </tr>\n",
" <tr>\n",
" <th>143</th>\n",
" <td>22</td>\n",
" <td>0</td>\n",
" <td>17</td>\n",
" </tr>\n",
" <tr>\n",
" <th>68</th>\n",
" <td>14</td>\n",
" <td>0</td>\n",
" <td>38</td>\n",
" </tr>\n",
" <tr>\n",
" <th>67</th>\n",
" <td>20</td>\n",
" <td>1</td>\n",
" <td>26</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>34</td>\n",
" <td>0</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>40</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>11</td>\n",
" <td>1</td>\n",
" <td>11</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" <td>12</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>16</td>\n",
" <td>1</td>\n",
" <td>14</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>9</td>\n",
" <td>1</td>\n",
" <td>13</td>\n",
" </tr>\n",
" <tr>\n",
" <th>133</th>\n",
" <td>10</td>\n",
" <td>1</td>\n",
" <td>19</td>\n",
" </tr>\n",
" <tr>\n",
" <th>71</th>\n",
" <td>10</td>\n",
" <td>1</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" <td>24</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>12</td>\n",
" </tr>\n",
" <tr>\n",
" <th>38</th>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>15</td>\n",
" </tr>\n",
" <tr>\n",
" <th>49</th>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>16</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>35</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>43</td>\n",
" <td>0</td>\n",
" <td>9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>41</td>\n",
" <td>0</td>\n",
" <td>17</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>12</td>\n",
" <td>1</td>\n",
" <td>16</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>23</td>\n",
" <td>0</td>\n",
" <td>15</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>24</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>39</th>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>47</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>11</td>\n",
" <td>1</td>\n",
" <td>24</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>38</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>136</th>\n",
" <td>31</td>\n",
" <td>1</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>21</td>\n",
" </tr>\n",
" <tr>\n",
" <th>41</th>\n",
" <td>16</td>\n",
" <td>1</td>\n",
" <td>9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>37</th>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>15</td>\n",
" </tr>\n",
" <tr>\n",
" <th>56</th>\n",
" <td>21</td>\n",
" <td>1</td>\n",
" <td>22</td>\n",
" </tr>\n",
" <tr>\n",
" <th>134</th>\n",
" <td>23</td>\n",
" <td>1</td>\n",
" <td>8</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Age Gender Time\n",
"116 6 1 29\n",
"143 22 0 17\n",
"68 14 0 38\n",
"67 20 1 26\n",
"154 34 0 8\n",
"113 40 0 3\n",
"23 11 1 11\n",
"9 21 0 12\n",
"120 16 1 14\n",
"22 9 1 13\n",
"133 10 1 19\n",
"71 10 1 2\n",
"118 6 1 24\n",
"103 7 0 12\n",
"38 8 0 15\n",
"49 7 1 16\n",
"152 1 0 35\n",
"146 43 0 9\n",
"30 41 0 17\n",
"6 12 1 16\n",
"96 23 0 15\n",
"107 24 0 3\n",
"39 10 0 47\n",
"148 11 1 24\n",
"126 38 1 6\n",
"136 31 1 8\n",
"128 5 0 21\n",
"41 16 1 9\n",
"37 8 0 15\n",
"56 21 1 22\n",
"134 23 1 8"
]
},
"execution_count": 24,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"X_test"
]
},
{
"cell_type": "code",
"execution_count": 25,
"id": "c1a60e76",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"20 1\n",
"51 1\n",
"62 1\n",
"127 0\n",
"2 1\n",
" ..\n",
"26 1\n",
"89 1\n",
"65 1\n",
"80 1\n",
"140 1\n",
"Name: Positivity, Length: 124, dtype: int64"
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Y_train"
]
},
{
"cell_type": "code",
"execution_count": 26,
"id": "90199cc3",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"116 0\n",
"143 0\n",
"68 0\n",
"67 1\n",
"154 1\n",
"113 1\n",
"23 1\n",
"9 1\n",
"120 1\n",
"22 0\n",
"133 0\n",
"71 0\n",
"118 0\n",
"103 1\n",
"38 0\n",
"49 1\n",
"152 1\n",
"146 1\n",
"30 1\n",
"6 0\n",
"96 1\n",
"107 1\n",
"39 1\n",
"148 1\n",
"126 1\n",
"136 1\n",
"128 0\n",
"41 1\n",
"37 0\n",
"56 1\n",
"134 1\n",
"Name: Positivity, dtype: int64"
]
},
"execution_count": 26,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Y_test"
]
},
{
"cell_type": "code",
"execution_count": 27,
"id": "89af21b6",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(124, 3)"
]
},
"execution_count": 27,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"X_train.shape"
]
},
{
"cell_type": "code",
"execution_count": 28,
"id": "8d018ac0",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(124,)"
]
},
"execution_count": 28,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Y_train.shape"
]
},
{
"cell_type": "code",
"execution_count": 29,
"id": "915b4485",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(31, 3)"
]
},
"execution_count": 29,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"X_test.shape"
]
},
{
"cell_type": "code",
"execution_count": 30,
"id": "03088479",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(31,)"
]
},
"execution_count": 30,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Y_test.shape"
]
},
{
"cell_type": "code",
"execution_count": 31,
"id": "5c6d11b4",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.ensemble import RandomForestClassifier"
]
},
{
"cell_type": "code",
"execution_count": 32,
"id": "e5348084",
"metadata": {},
"outputs": [],
"source": [
"randomforestclassifier = RandomForestClassifier(n_estimators=100)"
]
},
{
"cell_type": "code",
"execution_count": 33,
"id": "3bd114d1",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"RandomForestClassifier()"
]
},
"execution_count": 33,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"randomforestclassifier.fit(X_train,Y_train)"
]
},
{
"cell_type": "code",
"execution_count": 34,
"id": "dbee1d71",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"RandomForestClassifier()"
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"randomforestclassifier.fit(X_train,Y_train)"
]
},
{
"cell_type": "code",
"execution_count": 35,
"id": "9efae75d",
"metadata": {},
"outputs": [],
"source": [
"prediction_y = randomforestclassifier.predict(X_test)"
]
},
{
"cell_type": "code",
"execution_count": 36,
"id": "4f592694",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1,\n",
" 0, 1, 1, 1, 1, 1, 0, 1, 1], dtype=int64)"
]
},
"execution_count": 36,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"prediction_y"
]
},
{
"cell_type": "code",
"execution_count": 37,
"id": "fc2e5108",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Accuracy score is: 0.7419354838709677\n"
]
}
],
"source": [
"experiment_accuracy = sm.accuracy_score(Y_test, prediction_y)\n",
"print('Accuracy score is: ' , str(experiment_accuracy))"
]
},
{
"cell_type": "code",
"execution_count": 38,
"id": "baca14d3",
"metadata": {},
"outputs": [],
"source": [
"from sklearn import metrics"
]
},
{
"cell_type": "code",
"execution_count": 39,
"id": "e7e41e42",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Classification report: precision recall f1-score support\n",
"\n",
" Covid danger 0.64 0.64 0.64 11\n",
"not Covid danger 0.80 0.80 0.80 20\n",
"\n",
" accuracy 0.74 31\n",
" macro avg 0.72 0.72 0.72 31\n",
" weighted avg 0.74 0.74 0.74 31\n",
"\n"
]
}
],
"source": [
"print(\"Classification report: \" , metrics.classification_report(prediction_y,Y_test,target_names=[\"Covid danger\", \"not Covid danger\"]))"
]
},
{
"cell_type": "code",
"execution_count": 40,
"id": "b4381ed6",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.metrics import confusion_matrix"
]
},
{
"cell_type": "code",
"execution_count": 41,
"id": "89aca29f",
"metadata": {},
"outputs": [],
"source": [
"import seaborn as sb"
]
},
{
"cell_type": "code",
"execution_count": 42,
"id": "2e1efd5d",
"metadata": {},
"outputs": [],
"source": [
"sb.set()"
]
},
{
"cell_type": "code",
"execution_count": 43,
"id": "2e8f7bff",
"metadata": {},
"outputs": [],
"source": [
"get_ipython().run_line_magic('matplotlib','inline')"
]
},
{
"cell_type": "code",
"execution_count": 44,
"id": "a297a2b9",
"metadata": {},
"outputs": [],
"source": [
"import matplotlib.pyplot as pt"
]
},
{
"cell_type": "code",
"execution_count": 45,
"id": "a797bdf7",
"metadata": {},
"outputs": [],
"source": [
"confusionmt = confusion_matrix(Y_test,prediction_y)"
]
},
{
"cell_type": "code",
"execution_count": 46,
"id": "921b0485",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Text(89.18, 0.5, 'predicted class axis')"
]
},
"execution_count": 46,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAQkAAAEJCAYAAACHaNJkAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8QVMy6AAAACXBIWXMAAAsTAAALEwEAmpwYAAAQt0lEQVR4nO3dffhnc53H8ecwIyRqNbuMkkjvEgaRMJUxyKKlMau2cjOF1TTSlaSSNlrbTu0KrawJyV0lpRUKIXdNwlZG6n1t4nIzmtxkKzfLzPz2j/Od6Wea3+d3hjm/c36+z8d1ub7fc743522u+b7mcz6fz/mcMQMDA0jSUFZquwBJ3WZISCoyJCQVGRKSigwJSUWGhKSisW0XUMd7N5jmOO0ocva8OW2XoOW04Kn7xwz1mi0JSUWGhKQiQ0JSkSEhqciQkFRkSEgqMiQkFRkSkooMCUlFhoSkIkNCUpEhIanIkJBUZEhIKjIkJBUZEpKKDAlJRYaEpCJDQlKRISGpyJCQVGRISCoyJCQVGRKSigwJSUWGhKQiQ0JSkSEhqciQkFRkSEgqMiQkFRkSkooMCUlFhoSkIkNCUpEhIanIkJBUZEhIKjIkJBUZEpKKDAlJRYaEpCJDQlKRISGpyJCQVGRISCoyJCQVGRKSigwJSUVj2y6gH+0wbUd2mDYZgHEvGMf6m2zAh7Y5iCf+8HjLlalk/Pi1+cmPv89uu7+TzDvbLmfEGBItuPHCH3LjhT8E4D3HHcQNF1xtQHTc2LFjOfVLs3jiySfbLmXENRYSEfEaYBrwMmARMA/4fmbe0tQxR5sNNtuICa9+Oed+6vS2S9EwPjfrGGbPPoejPjqz7VJGXCN9EhExA/h6b/Nm4L97z78cEUc0cczRaI8PTOXiky5ouwwNY//99uWhhx7hiiuvbbuUVjTVkjgc2DIzn9GGjogTqALj3xs67qix2pqrs+5GE/jVnF+0XYqGMf3AdzAwMMCUnSYxceLrOOvMk9h76nTmz3+w7dJGRFMhsQAYt4z9qwFPN3TMUSXesAl33DC37TJUw+Qp+yx5ftWV32TGzI/1TUBAcyFxPPDTiLgKeAAYACYAOwFHN3TMUWWdDSfw4L3z2y5DGtaYgYGB2m+OiFWAdTLznhrvnQDsTBUOKwH3AT/IzHnLW+R7N5hWv0i17ux5c9ouQctpwVP3jxnqtWFbEhHxdqoWwCeAucBaEfHpzDyp9LleGJy9nLVK6pg6oxsfB2YD+wBzgPWB/ZosSlJ31AmJMZk5l+rU4XuZ+cean5P0PFDnx74oIvYF3gpcERG7U02OktQH6oTEEcAhwNGZ+Vuq0YnDG61KUmcM23GZmTdQnWos3t6h0YokdcqQIRERF2TmvhExl2qewzNk5uaNViapE0otiVm9x/67okXSEkOGRGbe2nv68sw8d/H+iFiZakZlf17tIvWZOtOyPxERO1B1Vk4AvgH0z8R1qc/VGd3YhupirVuB64EvZ+aejVYlqTPqhMQA8H/A6r33O0dC6iN1QuI2YE1gIvAW4NCIuLjRqiR1Rp0+ieMyc/GFWr/u9U8c32BNkjqkzmSqsyPir4AXAmOAlYErmy5MUjfUuVT8OKorQaFacWoV4A5gswbrktQRdfok9qe6PPxCYGPgQMCFGaU+USckfpeZDwC/BCZm5jnYipD6Rp2QeDoiNgISeFNEjAVWbbYsSV1RJyQ+S7Uy1SXAVOBe4Oomi5LUHXVGNy6hCggiYguqfonbmi1LUlcs15L6vZvt/LyhWiR1kGtVSioyJCQV1QqJiNiw97hHRBwTEWs1W5akrhg2JCLiNOCoiHgt8GVgQ+DMpguT1A11WhKvB94PvB34amZOB17RaFWSOqNOSKyUmYuAXfjz/IjVmytJUpfUCYlfR8RlVKcZ10bEeThPQuobdUJiOnA+8JbMfIpqCbv3NlqVpM4YNiQy8zHgR5l5d0TsAYynWvNSUh9wdENSkaMbkooc3ZBUtLyjGz90dEPqL8s7uvE01ejG9EarktQZdUc3LgMWRsT6wOXApKYLk9QNrpYtqcjVsiUVuVq2pCJXy5ZUtLyrZe9DtVr2NU0WJak7lne17InAxpnpYrhSnxgyJCLi5MJrZOYHmylJUpeUWhIPj1gVkjpryJDIzGMBImIcsG9mnhcR6wDvBIZsZUh6fqnTcXkKsGfv+SLgTcCJTRUkqVvqhMT2mfkPAJn5O+DvgcmNViWpM+qExLiIWGXQ9nLdGlDS6FbnB38pcHlEnAMMAO/q7ZPUB+qExJHAB4C9qC7w+jZwWpNFLe3seXNG8nB6jp6Yd33bJWgFGjMwMNB2DcMau8p63S9SSxgSo8+4l244ZqjXvGGwpCJDQlKRISGpqHTtxqdKH8zM41Z8OZK6pjS6Mb73+BoggIuoRjf2wtWypb5RunbjMICIuBrYKjMf6m3/M/BfI1OepLbV6ZNYd3FA9DwK/HUz5UjqmjqTqW6LiK8AZwNjgPcBNzValaTOqNOSOIiq9XAS1dWf9wGHNleSpC6pNeMyIlajWk7/dmDVzHy86cIGc8bl6OKMy9HnOc24jIg3AndSrXM5Abg3IrZfceVJ6rI6pxufB3YGHs7M+4D9qE49JPWBOiGxembesXgjMy/DNSWkvlH35jwvoVpLgoiIZkuS1CV1WgTHA9cC60TE14BdgUMarUpSZ9Qd3XgVsAuwMnBVZv6y6cIGc3RjdHF0Y/QpjW4M25KIiDMy833ArwftuzAzp62g+iR1WOkq0FOB9ahuEjx+0EvjgA2bLkxSN5RaEmcAmwITgW8N2r8A+HGTRUnqjiFHNzLzlsw8C9gBuCszvwp8F3gsM+8cofoktazOEOj7gWN7z1cHPhYRn2yuJEldUick9qIa9qQ34/ItVPcDldQHat3BKzOfHrT9FNU9QSX1gTqTqW6MiPOoOjIHgANwPQmpb9RpSRwGzAe+APxb7/nhTRYlqTu8g5dWOGdcjj7PasZlRFyQmftGxFx6F3cNlpmbr6D6JHVYqU9iVu9x5kgUIqmbSiHxYESsD9w1UsVI6p5SSPyC6jRjJWA14I/AQuDFwO+AdZsuTlL7StOyX5SZawLnAe/OzBdn5trA24HvjVSBktpVZwh068z8+uKNzLwY2KKxiiR1Sp2QWCkidly8ERG74YxLqW/UmXH5QeCCiHiK6g5eY4C9myxKUnfUXb5uHLBZb/O2zFzQaFVLcTLV6OJkqtHnud6cZw2qKdmfB+4GTuntk9QH6vRJnAz8L/A3wJPAmsDsJouS1B11QmLLzDwaeLp3D9B34+iG1DfqhMTCpbZXxtENqW/UCYnrImIWsFpEvBX4NnBNs2VJ6oo6IXEU8CeqfonjgduAI5ssSlJ31JkncVxmfhz4TNPFSOqeOi2JPRuvQlJn1WlJ/CYirgBuoDrtACAzT2isKkmdUSckHuk9vnLQPmdASn2i9hqXEfESYGFm/qHZkv6S07JHF6dljz7PdVp2RMTNVAvNPBwR1/ZWrJLUB+p0XJ4FnE51i781gAup7sEhqQ/U6ZNYPTNPG7T9xYg4uKmCJHVLnZbEryJi+8UbEbEpLo77nI0fvzZ33XkzERu1XYoKbvvFrzhw5kcBePj3j3LYUcdywIwjec+hR3DPffNarm5k1GlJvAK4NiJ+DiwAtgR+GxG3gfffeDbGjh3LqV+axRNPPtl2KSo487xv8t3vX81qq74AgBNOOYM9dp3MblPezE9u/Tl33XMf679sQstVNq/utOydgSN6z3cF9qe6/d9hzZX2/PW5Wccwe/Y5PDDvt22XooKXT1iXE//lk0u2fzr3DuY/+BAHHf5xLrniGrbZsj/+fRy2JZGZ1y7vlw43+pGZ9yzvdz5f7L/fvjz00CNcceW1HPVR73vUZbtMnsT9D8xfsj3vgfms+aI1OP2kz3Lqmedx5rkXMPPg/VuscGTUOd14Ni4FNgbmUa2JOdgAsGFDx+286Qe+g4GBAabsNImJE1/HWWeexN5TpzN//oNtl6ZhrLXWmkye9EYAdpy0LSef9tWWKxoZTYXEDsD1wIzMvLGhY4xKk6fss+T5VVd+kxkzP2ZAjBJbbb4J1825mb/bbQq3/Ox2NnrlK9ouaUTU6ZNYbr1ZmQcDBzTx/VIbjjzsYC7+3lW8+x8/zI033crB+7+j7ZJGRO1p2W1yWvbo4rTs0ec5TcuW1N8MCUlFhoSkIkNCUpEhIanIkJBUZEhIKjIkJBUZEpKKDAlJRYaEpCJDQlKRISGpyJCQVGRISCoyJCQVGRKSigwJSUWGhKQiQ0JSkSEhqciQkFRkSEgqMiQkFRkSkooMCUlFhoSkIkNCUpEhIanIkJBUZEhIKjIkJBUZEpKKDAlJRYaEpCJDQlKRISGpyJCQVGRISCoyJCQVGRKSigwJSUWGhKQiQ0JSkSEhqciQkFRkSEgqMiQkFRkSkooMCUlFYwYGBtquQVKH2ZKQVGRISCoyJCQVGRKSigwJSUWGhKQiQ0JSkSEhqciQkFQ0tu0C+lVEvAv4JDAOODEzT2m5JA0jItYEfgTsmZl3t1zOiLEl0YKIWA84HpgEbAEcEhGbtFqUiiJiW+AG4NVt1zLSDIl27AxcnZmPZOZjwIXAtJZrUtnBwAeAeW0XMtI83WjHBOCBQdsPAG9oqRbVkJkHAURE26WMOFsS7VgJGHz57RhgUUu1SEWGRDvuA9YdtL0OfdiM1ejg6UY7fgB8OiLGA48B+wCHtFuStGy2JFqQmfcDRwPXAD8Dzs/Mn7RalDQEV6aSVGRLQlKRISGpyJCQVGRISCoyJCQVGRKjXERcEREvbeG4A20ctyQiTo+Induu4/nGyVSj3y5tF9AVi6+v0IrlPIlRLCK+AhwI3A7sDlwP3ARsDnwC+AIwLTNv6b3/7sXbEbE9MAt4IbAQODYzL1nGMbYFTu697yngI5l5dUQMAOOBJ4BTgY2BtYE/Au/KzIyIqVRrZizqHePIzLxuqP1LHfeFy/pe4B7gFuCUzPxSRLwP+BCwLXAZ8B/Ad4AvAjsATwO/AaZn5p+W+w9Znm6MZpk5vfd0cmbe23t+e2a+NjMvGupzEfES4CvAfpm5FbAXcGpErL/U+8ZR/eCOy8xNqS6XPikiBv+9+Vvg0czcLjNfDdwMzOy99nlgRmZuDRwD7DjM/sGW+b2Z+QTwTuC4iNidal2OaZn5+KDPbtf7zomZ+XqqkNh8qD8PlXm68fxzfY33bEd1gdl3Bl36PED1Q7pn0Ps2AxZm5qUAmXlrb9+SS6Yz88KI+E1EHAa8iurHOaf3+a8DF0XEpcCVwOeG2b9E6Xszc25EHAtcAhyQmbnUx+dStVBuiojLgW857f3ZsyXx/DO4ST1AdRn6Yqv0HlcGfpmZWyz+D3gjcPlS37WAZ17STkRsGhFjB22/HzgDeBw4H/ja4mNm5tFUq2/dQnVadF1p/1LHGfJ7e14HzO/V/QyZ+SgwEfgIVVh8IyJmLP0+1WNIjH4LqdbJXJYHga0BImJH/nx5+o+BjSPizb3XtgD+B1hvqc8nMBARu/TetxVwNc/8e/NW4KzMPKP3/rcBK0fE2F4fyOqZ+Z/ADGDziHjBUPuXOvYyv7dXx1RgJ6qWz64RsffgD0bEnsBVwI8y89PA2cA2Q/wZaRh2XI5yEfE14PXAVKrm9+COyslUnX9PArdS/et6aK/jcjLwr8CqVD/6f8rMby/j+7cGTgTWoOq4/HBm3jCo4/I1wGyqVscYqlOCzTJzu96P9zNUnYeLgBMy8/yh9i913EnL+l5g397/y9sy86ZeB+x3gK2Ac6k6Li+i6mydQtWy+j1wcD8tXrsiGRKSijzdkFRkSEgqMiQkFRkSkooMCUlFhoSkIkNCUpEhIano/wGuI5Tmorcb4QAAAABJRU5ErkJggg==\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"sb.heatmap(confusionmt.T, square=True, annot=True,fmt='d', cbar=False)\n",
"pt.xlabel('true class axis')\n",
"pt.ylabel('predicted class axis')"
]
},
{
"cell_type": "code",
"execution_count": 47,
"id": "6aeb3e95",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Text(0, 0.5, 'predicted class axis')"
]
},
"execution_count": 47,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"pt.xlabel('true class axis')\n",
"pt.ylabel('predicted class axis')"
]
},
{
"cell_type": "code",
"execution_count": 48,
"id": "89e6b6c0",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"<ipython-input-48-6223ed64eca5>:3: UserWarning: To output multiple subplots, the figure containing the passed axes is being cleared\n",
" breathing_dataset.hist(ax = axis)\n"
]
},
{
"data": {
"text/plain": [
"array([[<AxesSubplot:title={'center':'Age'}>,\n",
" <AxesSubplot:title={'center':'Gender'}>],\n",
" [<AxesSubplot:title={'center':'Positivity'}>,\n",
" <AxesSubplot:title={'center':' Time'}>]], dtype=object)"
]
},
"execution_count": 48,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 1440x1800 with 4 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"figures = plt.figure(figsize = (20,25))\n",
"axis = figures.gca()\n",
"breathing_dataset.hist(ax = axis)"
]
},
{
"cell_type": "code",
"execution_count": 49,
"id": "94980da4",
"metadata": {},
"outputs": [],
"source": [
"import pickle\n",
"with open('framingham_classifier_randomforestclassifier', 'wb') as picklefile1:\n",
" pickle.dump(randomforestclassifier,picklefile1)"
]
},
{
"cell_type": "code",
"execution_count": 50,
"id": "296183c0",
"metadata": {},
"outputs": [],
"source": [
"with open('framingham_classifier_randomforestclassifier', 'rb') as training_model1:\n",
" model6 = pickle.load(training_model1)"
]
},
{
"cell_type": "code",
"execution_count": 51,
"id": "2b3420e2",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.preprocessing import MinMaxScaler\n",
"scaler = MinMaxScaler(feature_range=(0,1)) \n",
"\n",
"#assign scaler to column:\n",
"breathing_dataset_scaled = pd.DataFrame(scaler.fit_transform(breathing_dataset), columns=breathing_dataset.columns)"
]
},
{
"cell_type": "code",
"execution_count": 59,
"id": "c04f8a06",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Input Patient Information:\n",
"Patient's age: >>> 52\n",
"Patient's gender. male=0, female=1: >>> 1\n",
"Patient's breathing Time: >>> 18\n",
"\n",
"\n",
"Result:\n",
"The patient is in danger.\n"
]
}
],
"source": [
"def start_questionnaire():\n",
" my_predictors = []\n",
" parameters=['Age', 'Gender','Time']\n",
" \n",
" print('Input Patient Information:')\n",
" \n",
" Age = input(\"Patient's age: >>> \") \n",
" my_predictors.append(Age)\n",
" Gender = input(\"Patient's gender. male=0, female=1: >>> \") \n",
" my_predictors.append(Gender)\n",
" Time = input(\"Patient's breathing Time: >>> \") \n",
" my_predictors.append(Time)\n",
" \n",
"\n",
" my_data = dict(zip(parameters, my_predictors))\n",
" my_df = pd.DataFrame(my_data, index=[0])\n",
" scaler = MinMaxScaler(feature_range=(0,1)) \n",
"\n",
" # assign scaler to column:\n",
" my_df_scaled = pd.DataFrame(scaler.fit_transform(my_df), columns=my_df.columns)\n",
" my_y_pred = model6.predict(my_df)\n",
" print('\\n')\n",
" print('Result:')\n",
" if my_y_pred == 1:\n",
" print(\"The patient is in danger.\")\n",
" if my_y_pred == 0:\n",
" print(\"The patient is not in danger.\")\n",
"\n",
"start_questionnaire()"
]
},
{
"cell_type": "code",
"execution_count": 53,
"id": "fd000e4b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"dtype('O')"
]
},
"execution_count": 53,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"breathing_dataset.dtypes.dtypes"
]
},
{
"cell_type": "code",
"execution_count": 54,
"id": "8a25cd18",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.tree import DecisionTreeClassifier"
]
},
{
"cell_type": "code",
"execution_count": 55,
"id": "39e9b76b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"DecisionTreeClassifier(max_depth=3, random_state=0)"
]
},
"execution_count": 55,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"clf = DecisionTreeClassifier(criterion='gini', max_depth=3, random_state=0)\n",
"\n",
"clf.fit(X_train, Y_train)"
]
},
{
"cell_type": "code",
"execution_count": 56,
"id": "b1771cd1",
"metadata": {},
"outputs": [],
"source": [
"y_pred_gini = clf.predict(X_test)"
]
},
{
"cell_type": "code",
"execution_count": 57,
"id": "fbe51032",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Model accuracy score with decision tree classifier: 0.6774193548387096\n"
]
}
],
"source": [
"from sklearn.metrics import accuracy_score\n",
"\n",
"print('Model accuracy score with decision tree classifier: ', accuracy_score(Y_test, y_pred_gini))"
]
},
{
"cell_type": "code",
"execution_count": 58,
"id": "be0b08ad",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Model accuracy score with logistic regression classifier: 0.6129032258064516\n"
]
}
],
"source": [
"from sklearn.linear_model import LogisticRegression\n",
"logreg=LogisticRegression()\n",
"logreg.fit(X_train,Y_train)\n",
"y_pred1 =logreg.predict(X_test)\n",
"\n",
"\n",
"from sklearn import metrics\n",
"\n",
"print('Model accuracy score with logistic regression classifier: ', metrics.accuracy_score(Y_test,y_pred1))\n",
"#print(metrics.classification_report(y_test,y_pred)),metrics.confusion_matrix(y_test,y_pred)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "090bf27a",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.8"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment