Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
2
2023-362
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
2023-362
2023-362
Commits
3b68e467
Commit
3b68e467
authored
Nov 03, 2023
by
Nirmal M.D.S
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Upload New File
parent
00259407
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
1587 additions
and
0 deletions
+1587
-0
IT20074340/Final_Naive_Bayes_Prediction.ipynb
IT20074340/Final_Naive_Bayes_Prediction.ipynb
+1587
-0
No files found.
IT20074340/Final_Naive_Bayes_Prediction.ipynb
0 → 100644
View file @
3b68e467
{
"cells"
:
[
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"id"
:
"pIPRzpKBdHYW"
,
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"outputId"
:
"8e883495-ed72-4704-ee9d-f9c5a6465ebf"
},
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"Mounted at /content/drive
\n
"
]
}
],
"source"
:
[
"from google.colab import drive
\n
"
,
"drive.mount('/content/drive')"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"EQWrFYcidIGL"
,
"outputId"
:
"6035b7de-c51d-4374-b143-01fa48ba3934"
},
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"/content/drive/My Drive/PP1 Practice
\n
"
]
}
],
"source"
:
[
"%cd
\"
/content/drive/My Drive/PP1 Practice/
\"
"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"id"
:
"7cIHFinPt0KH"
},
"outputs"
:
[],
"source"
:
[
"#import packages
\n
"
,
"import pandas as pd
\n
"
,
"from sklearn.feature_extraction.text import TfidfVectorizer
\n
"
,
"from sklearn.feature_extraction.text import CountVectorizer
\n
"
,
"from sklearn.model_selection import train_test_split
\n
"
,
"from sklearn.naive_bayes import MultinomialNB
\n
"
,
"
\n
"
,
"from sklearn.metrics import classification_report
\n
"
,
"from sklearn.metrics import accuracy_score"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
,
"height"
:
206
},
"id"
:
"rl4NpPiKt4Y-"
,
"outputId"
:
"d2a60f7e-080a-456e-bf64-07586069b272"
},
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
" ProjectName TaskDescription
\\\n
"
,
"0 E-commerce Website Implement a user registration and login system...
\n
"
,
"1 Mobile App Development Develop a push notification feature for the mo...
\n
"
,
"2 Data Analytics Platform Build a data visualization module that present...
\n
"
,
"3 CRM System Upgrade Enhance the existing customer relationship man...
\n
"
,
"4 Bug Tracking Tool Create a web-based bug tracking tool that allo...
\n
"
,
"
\n
"
,
" Level
\n
"
,
"0 Low
\n
"
,
"1 Low
\n
"
,
"2 Low
\n
"
,
"3 Low
\n
"
,
"4 Low "
],
"text/html"
:
[
"
\n
"
,
" <div id=
\"
df-65fab58d-70aa-44dc-b052-21323b44bec0
\"
class=
\"
colab-df-container
\"
>
\n
"
,
" <div>
\n
"
,
"<style scoped>
\n
"
,
" .dataframe tbody tr th:only-of-type {\n"
,
" vertical-align: middle;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe tbody tr th {\n"
,
" vertical-align: top;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe thead th {\n"
,
" text-align: right;
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"<table border=
\"
1
\"
class=
\"
dataframe
\"
>
\n
"
,
" <thead>
\n
"
,
" <tr style=
\"
text-align: right;
\"
>
\n
"
,
" <th></th>
\n
"
,
" <th>ProjectName</th>
\n
"
,
" <th>TaskDescription</th>
\n
"
,
" <th>Level</th>
\n
"
,
" </tr>
\n
"
,
" </thead>
\n
"
,
" <tbody>
\n
"
,
" <tr>
\n
"
,
" <th>0</th>
\n
"
,
" <td>E-commerce Website</td>
\n
"
,
" <td>Implement a user registration and login system...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>1</th>
\n
"
,
" <td>Mobile App Development</td>
\n
"
,
" <td>Develop a push notification feature for the mo...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>2</th>
\n
"
,
" <td>Data Analytics Platform</td>
\n
"
,
" <td>Build a data visualization module that present...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>3</th>
\n
"
,
" <td>CRM System Upgrade</td>
\n
"
,
" <td>Enhance the existing customer relationship man...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>4</th>
\n
"
,
" <td>Bug Tracking Tool</td>
\n
"
,
" <td>Create a web-based bug tracking tool that allo...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" </tr>
\n
"
,
" </tbody>
\n
"
,
"</table>
\n
"
,
"</div>
\n
"
,
" <div class=
\"
colab-df-buttons
\"
>
\n
"
,
"
\n
"
,
" <div class=
\"
colab-df-container
\"
>
\n
"
,
" <button class=
\"
colab-df-convert
\"
onclick=
\"
convertToInteractive('df-65fab58d-70aa-44dc-b052-21323b44bec0')
\"\n
"
,
" title=
\"
Convert this dataframe to an interactive table.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
" <svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 -960 960 960
\"
>
\n
"
,
" <path d=
\"
M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z
\"
/>
\n
"
,
" </svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
" <style>
\n
"
,
" .colab-df-container {\n"
,
" display:flex;
\n
"
,
" gap: 12px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert {\n"
,
" background-color: #E8F0FE;
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: #1967D2;
\n
"
,
" height: 32px;
\n
"
,
" padding: 0 0 0 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert:hover {\n"
,
" background-color: #E2EBFA;
\n
"
,
" box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: #174EA6;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-buttons div {\n"
,
" margin-bottom: 4px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert {\n"
,
" background-color: #3B4455;
\n
"
,
" fill: #D2E3FC;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert:hover {\n"
,
" background-color: #434B5C;
\n
"
,
" box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);
\n
"
,
" filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));
\n
"
,
" fill: #FFFFFF;
\n
"
,
" }
\n
"
,
" </style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" const buttonEl =
\n
"
,
" document.querySelector('#df-65fab58d-70aa-44dc-b052-21323b44bec0 button.colab-df-convert');
\n
"
,
" buttonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
"
\n
"
,
" async function convertToInteractive(key) {\n"
,
" const element = document.querySelector('#df-65fab58d-70aa-44dc-b052-21323b44bec0');
\n
"
,
" const dataTable =
\n
"
,
" await google.colab.kernel.invokeFunction('convertToInteractive',
\n
"
,
" [key], {});
\n
"
,
" if (!dataTable) return;
\n
"
,
"
\n
"
,
" const docLinkHtml = 'Like what you see? Visit the ' +
\n
"
,
" '<a target=
\"
_blank
\"
href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'
\n
"
,
" + ' to learn more about interactive tables.';
\n
"
,
" element.innerHTML = '';
\n
"
,
" dataTable['output_type'] = 'display_data';
\n
"
,
" await google.colab.output.renderOutput(dataTable, element);
\n
"
,
" const docLink = document.createElement('div');
\n
"
,
" docLink.innerHTML = docLinkHtml;
\n
"
,
" element.appendChild(docLink);
\n
"
,
" }
\n
"
,
" </script>
\n
"
,
" </div>
\n
"
,
"
\n
"
,
"
\n
"
,
"<div id=
\"
df-1451cc01-be01-4fc6-b22d-3ae6b9dcce52
\"
>
\n
"
,
" <button class=
\"
colab-df-quickchart
\"
onclick=
\"
quickchart('df-1451cc01-be01-4fc6-b22d-3ae6b9dcce52')
\"\n
"
,
" title=
\"
Suggest charts.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
"<svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 0 24 24
\"\n
"
,
" width=
\"
24px
\"
>
\n
"
,
" <g>
\n
"
,
" <path d=
\"
M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z
\"
/>
\n
"
,
" </g>
\n
"
,
"</svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
"<style>
\n
"
,
" .colab-df-quickchart {\n"
,
" --bg-color: #E8F0FE;
\n
"
,
" --fill-color: #1967D2;
\n
"
,
" --hover-bg-color: #E2EBFA;
\n
"
,
" --hover-fill-color: #174EA6;
\n
"
,
" --disabled-fill-color: #AAA;
\n
"
,
" --disabled-bg-color: #DDD;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-quickchart {\n"
,
" --bg-color: #3B4455;
\n
"
,
" --fill-color: #D2E3FC;
\n
"
,
" --hover-bg-color: #434B5C;
\n
"
,
" --hover-fill-color: #FFFFFF;
\n
"
,
" --disabled-bg-color: #3B4455;
\n
"
,
" --disabled-fill-color: #666;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart {\n"
,
" background-color: var(--bg-color);
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: var(--fill-color);
\n
"
,
" height: 32px;
\n
"
,
" padding: 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart:hover {\n"
,
" background-color: var(--hover-bg-color);
\n
"
,
" box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: var(--button-hover-fill-color);
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart-complete:disabled,
\n
"
,
" .colab-df-quickchart-complete:disabled:hover {\n"
,
" background-color: var(--disabled-bg-color);
\n
"
,
" fill: var(--disabled-fill-color);
\n
"
,
" box-shadow: none;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-spinner {\n"
,
" border: 2px solid var(--fill-color);
\n
"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" animation:
\n
"
,
" spin 1s steps(1) infinite;
\n
"
,
" }
\n
"
,
"
\n
"
,
" @keyframes spin {\n"
,
" 0% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 20% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 30% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 40% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 60% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 80% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 90% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" async function quickchart(key) {\n"
,
" const quickchartButtonEl =
\n
"
,
" document.querySelector('#' + key + ' button');
\n
"
,
" quickchartButtonEl.disabled = true; // To prevent multiple clicks.
\n
"
,
" quickchartButtonEl.classList.add('colab-df-spinner');
\n
"
,
" try {\n"
,
" const charts = await google.colab.kernel.invokeFunction(
\n
"
,
" 'suggestCharts', [key], {});
\n
"
,
" } catch (error) {\n"
,
" console.error('Error during call to suggestCharts:', error);
\n
"
,
" }
\n
"
,
" quickchartButtonEl.classList.remove('colab-df-spinner');
\n
"
,
" quickchartButtonEl.classList.add('colab-df-quickchart-complete');
\n
"
,
" }
\n
"
,
" (() => {\n"
,
" let quickchartButtonEl =
\n
"
,
" document.querySelector('#df-1451cc01-be01-4fc6-b22d-3ae6b9dcce52 button');
\n
"
,
" quickchartButtonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
" })();
\n
"
,
" </script>
\n
"
,
"</div>
\n
"
,
" </div>
\n
"
,
" </div>
\n
"
]
},
"metadata"
:
{},
"execution_count"
:
5
}
],
"source"
:
[
"#import data
\n
"
,
"df = pd.read_csv(
\"
/content/drive/MyDrive/PP1 Practice/TaskDescCopy3.csv
\"
)
\n
"
,
"
\n
"
,
"#inspect dataset
\n
"
,
"df.head()"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
,
"height"
:
210
},
"id"
:
"N7VfsALBt7E1"
,
"outputId"
:
"bf9728f0-4cb3-4ab1-c280-35d27c427a98"
},
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
" ProjectName
\\\n
"
,
" count unique top freq
\n
"
,
"Level
\n
"
,
"High 54 47 Recommendation System Evaluation 2
\n
"
,
"Low 94 82 Progressive Web Application 2
\n
"
,
"
\n
"
,
" TaskDescription
\\\n
"
,
" count unique
\n
"
,
"Level
\n
"
,
"High 54 47
\n
"
,
"Low 94 84
\n
"
,
"
\n
"
,
"
\n
"
,
" top freq
\n
"
,
"Level
\n
"
,
"High Evaluate and fine-tune the performance of a re... 2
\n
"
,
"Low Develop a custom data visualization library fo... 2 "
],
"text/html"
:
[
"
\n
"
,
" <div id=
\"
df-03695561-a5c6-4a46-bad1-590895806da8
\"
class=
\"
colab-df-container
\"
>
\n
"
,
" <div>
\n
"
,
"<style scoped>
\n
"
,
" .dataframe tbody tr th:only-of-type {\n"
,
" vertical-align: middle;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe tbody tr th {\n"
,
" vertical-align: top;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe thead tr th {\n"
,
" text-align: left;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe thead tr:last-of-type th {\n"
,
" text-align: right;
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"<table border=
\"
1
\"
class=
\"
dataframe
\"
>
\n
"
,
" <thead>
\n
"
,
" <tr>
\n
"
,
" <th></th>
\n
"
,
" <th colspan=
\"
4
\"
halign=
\"
left
\"
>ProjectName</th>
\n
"
,
" <th colspan=
\"
4
\"
halign=
\"
left
\"
>TaskDescription</th>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th></th>
\n
"
,
" <th>count</th>
\n
"
,
" <th>unique</th>
\n
"
,
" <th>top</th>
\n
"
,
" <th>freq</th>
\n
"
,
" <th>count</th>
\n
"
,
" <th>unique</th>
\n
"
,
" <th>top</th>
\n
"
,
" <th>freq</th>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>Level</th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" <th></th>
\n
"
,
" </tr>
\n
"
,
" </thead>
\n
"
,
" <tbody>
\n
"
,
" <tr>
\n
"
,
" <th>High</th>
\n
"
,
" <td>54</td>
\n
"
,
" <td>47</td>
\n
"
,
" <td>Recommendation System Evaluation</td>
\n
"
,
" <td>2</td>
\n
"
,
" <td>54</td>
\n
"
,
" <td>47</td>
\n
"
,
" <td>Evaluate and fine-tune the performance of a re...</td>
\n
"
,
" <td>2</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>Low</th>
\n
"
,
" <td>94</td>
\n
"
,
" <td>82</td>
\n
"
,
" <td>Progressive Web Application</td>
\n
"
,
" <td>2</td>
\n
"
,
" <td>94</td>
\n
"
,
" <td>84</td>
\n
"
,
" <td>Develop a custom data visualization library fo...</td>
\n
"
,
" <td>2</td>
\n
"
,
" </tr>
\n
"
,
" </tbody>
\n
"
,
"</table>
\n
"
,
"</div>
\n
"
,
" <div class=
\"
colab-df-buttons
\"
>
\n
"
,
"
\n
"
,
" <div class=
\"
colab-df-container
\"
>
\n
"
,
" <button class=
\"
colab-df-convert
\"
onclick=
\"
convertToInteractive('df-03695561-a5c6-4a46-bad1-590895806da8')
\"\n
"
,
" title=
\"
Convert this dataframe to an interactive table.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
" <svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 -960 960 960
\"
>
\n
"
,
" <path d=
\"
M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z
\"
/>
\n
"
,
" </svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
" <style>
\n
"
,
" .colab-df-container {\n"
,
" display:flex;
\n
"
,
" gap: 12px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert {\n"
,
" background-color: #E8F0FE;
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: #1967D2;
\n
"
,
" height: 32px;
\n
"
,
" padding: 0 0 0 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert:hover {\n"
,
" background-color: #E2EBFA;
\n
"
,
" box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: #174EA6;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-buttons div {\n"
,
" margin-bottom: 4px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert {\n"
,
" background-color: #3B4455;
\n
"
,
" fill: #D2E3FC;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert:hover {\n"
,
" background-color: #434B5C;
\n
"
,
" box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);
\n
"
,
" filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));
\n
"
,
" fill: #FFFFFF;
\n
"
,
" }
\n
"
,
" </style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" const buttonEl =
\n
"
,
" document.querySelector('#df-03695561-a5c6-4a46-bad1-590895806da8 button.colab-df-convert');
\n
"
,
" buttonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
"
\n
"
,
" async function convertToInteractive(key) {\n"
,
" const element = document.querySelector('#df-03695561-a5c6-4a46-bad1-590895806da8');
\n
"
,
" const dataTable =
\n
"
,
" await google.colab.kernel.invokeFunction('convertToInteractive',
\n
"
,
" [key], {});
\n
"
,
" if (!dataTable) return;
\n
"
,
"
\n
"
,
" const docLinkHtml = 'Like what you see? Visit the ' +
\n
"
,
" '<a target=
\"
_blank
\"
href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'
\n
"
,
" + ' to learn more about interactive tables.';
\n
"
,
" element.innerHTML = '';
\n
"
,
" dataTable['output_type'] = 'display_data';
\n
"
,
" await google.colab.output.renderOutput(dataTable, element);
\n
"
,
" const docLink = document.createElement('div');
\n
"
,
" docLink.innerHTML = docLinkHtml;
\n
"
,
" element.appendChild(docLink);
\n
"
,
" }
\n
"
,
" </script>
\n
"
,
" </div>
\n
"
,
"
\n
"
,
"
\n
"
,
"<div id=
\"
df-95404b73-c644-4d4d-9790-d47c084d8012
\"
>
\n
"
,
" <button class=
\"
colab-df-quickchart
\"
onclick=
\"
quickchart('df-95404b73-c644-4d4d-9790-d47c084d8012')
\"\n
"
,
" title=
\"
Suggest charts.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
"<svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 0 24 24
\"\n
"
,
" width=
\"
24px
\"
>
\n
"
,
" <g>
\n
"
,
" <path d=
\"
M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z
\"
/>
\n
"
,
" </g>
\n
"
,
"</svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
"<style>
\n
"
,
" .colab-df-quickchart {\n"
,
" --bg-color: #E8F0FE;
\n
"
,
" --fill-color: #1967D2;
\n
"
,
" --hover-bg-color: #E2EBFA;
\n
"
,
" --hover-fill-color: #174EA6;
\n
"
,
" --disabled-fill-color: #AAA;
\n
"
,
" --disabled-bg-color: #DDD;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-quickchart {\n"
,
" --bg-color: #3B4455;
\n
"
,
" --fill-color: #D2E3FC;
\n
"
,
" --hover-bg-color: #434B5C;
\n
"
,
" --hover-fill-color: #FFFFFF;
\n
"
,
" --disabled-bg-color: #3B4455;
\n
"
,
" --disabled-fill-color: #666;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart {\n"
,
" background-color: var(--bg-color);
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: var(--fill-color);
\n
"
,
" height: 32px;
\n
"
,
" padding: 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart:hover {\n"
,
" background-color: var(--hover-bg-color);
\n
"
,
" box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: var(--button-hover-fill-color);
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart-complete:disabled,
\n
"
,
" .colab-df-quickchart-complete:disabled:hover {\n"
,
" background-color: var(--disabled-bg-color);
\n
"
,
" fill: var(--disabled-fill-color);
\n
"
,
" box-shadow: none;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-spinner {\n"
,
" border: 2px solid var(--fill-color);
\n
"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" animation:
\n
"
,
" spin 1s steps(1) infinite;
\n
"
,
" }
\n
"
,
"
\n
"
,
" @keyframes spin {\n"
,
" 0% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 20% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 30% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 40% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 60% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 80% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 90% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" async function quickchart(key) {\n"
,
" const quickchartButtonEl =
\n
"
,
" document.querySelector('#' + key + ' button');
\n
"
,
" quickchartButtonEl.disabled = true; // To prevent multiple clicks.
\n
"
,
" quickchartButtonEl.classList.add('colab-df-spinner');
\n
"
,
" try {\n"
,
" const charts = await google.colab.kernel.invokeFunction(
\n
"
,
" 'suggestCharts', [key], {});
\n
"
,
" } catch (error) {\n"
,
" console.error('Error during call to suggestCharts:', error);
\n
"
,
" }
\n
"
,
" quickchartButtonEl.classList.remove('colab-df-spinner');
\n
"
,
" quickchartButtonEl.classList.add('colab-df-quickchart-complete');
\n
"
,
" }
\n
"
,
" (() => {\n"
,
" let quickchartButtonEl =
\n
"
,
" document.querySelector('#df-95404b73-c644-4d4d-9790-d47c084d8012 button');
\n
"
,
" quickchartButtonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
" })();
\n
"
,
" </script>
\n
"
,
"</div>
\n
"
,
" </div>
\n
"
,
" </div>
\n
"
]
},
"metadata"
:
{},
"execution_count"
:
6
}
],
"source"
:
[
"df.groupby('Level').describe()"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"id"
:
"N55IenEMBV85"
},
"outputs"
:
[],
"source"
:
[
"df['high'] = df['Level'].apply(lambda x: 1 if x == 'High' else 0)"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
,
"height"
:
424
},
"id"
:
"CpYAkj8iDqum"
,
"outputId"
:
"337669eb-4119-4c77-fb75-a397ecd83764"
},
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
" ProjectName
\\\n
"
,
"0 E-commerce Website
\n
"
,
"1 Mobile App Development
\n
"
,
"2 Data Analytics Platform
\n
"
,
"3 CRM System Upgrade
\n
"
,
"4 Bug Tracking Tool
\n
"
,
".. ...
\n
"
,
"143 Gamification Feature
\n
"
,
"144 Natural Language Understanding
\n
"
,
"145 Conversational Surveys
\n
"
,
"146 Data Privacy Impact Assessment
\n
"
,
"147 A/B Testing Platform
\n
"
,
"
\n
"
,
" TaskDescription Level high
\n
"
,
"0 Implement a user registration and login system... Low 0
\n
"
,
"1 Develop a push notification feature for the mo... Low 0
\n
"
,
"2 Build a data visualization module that present... Low 0
\n
"
,
"3 Enhance the existing customer relationship man... Low 0
\n
"
,
"4 Create a web-based bug tracking tool that allo... Low 0
\n
"
,
".. ... ... ...
\n
"
,
"143 Implement gamification features to enhance use... Low 0
\n
"
,
"144 Implement natural language understanding (NLU)... Low 0
\n
"
,
"145 Develop conversational surveys to collect feed... Low 0
\n
"
,
"146 Conduct a data privacy impact assessment (DPIA... High 1
\n
"
,
"147 Design and develop an A/B testing platform for... Low 0
\n
"
,
"
\n
"
,
"[148 rows x 4 columns]"
],
"text/html"
:
[
"
\n
"
,
" <div id=
\"
df-05b5924d-8eb6-41e7-bd96-af2144ab6f3f
\"
class=
\"
colab-df-container
\"
>
\n
"
,
" <div>
\n
"
,
"<style scoped>
\n
"
,
" .dataframe tbody tr th:only-of-type {\n"
,
" vertical-align: middle;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe tbody tr th {\n"
,
" vertical-align: top;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .dataframe thead th {\n"
,
" text-align: right;
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"<table border=
\"
1
\"
class=
\"
dataframe
\"
>
\n
"
,
" <thead>
\n
"
,
" <tr style=
\"
text-align: right;
\"
>
\n
"
,
" <th></th>
\n
"
,
" <th>ProjectName</th>
\n
"
,
" <th>TaskDescription</th>
\n
"
,
" <th>Level</th>
\n
"
,
" <th>high</th>
\n
"
,
" </tr>
\n
"
,
" </thead>
\n
"
,
" <tbody>
\n
"
,
" <tr>
\n
"
,
" <th>0</th>
\n
"
,
" <td>E-commerce Website</td>
\n
"
,
" <td>Implement a user registration and login system...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>1</th>
\n
"
,
" <td>Mobile App Development</td>
\n
"
,
" <td>Develop a push notification feature for the mo...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>2</th>
\n
"
,
" <td>Data Analytics Platform</td>
\n
"
,
" <td>Build a data visualization module that present...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>3</th>
\n
"
,
" <td>CRM System Upgrade</td>
\n
"
,
" <td>Enhance the existing customer relationship man...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>4</th>
\n
"
,
" <td>Bug Tracking Tool</td>
\n
"
,
" <td>Create a web-based bug tracking tool that allo...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>...</th>
\n
"
,
" <td>...</td>
\n
"
,
" <td>...</td>
\n
"
,
" <td>...</td>
\n
"
,
" <td>...</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>143</th>
\n
"
,
" <td>Gamification Feature</td>
\n
"
,
" <td>Implement gamification features to enhance use...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>144</th>
\n
"
,
" <td>Natural Language Understanding</td>
\n
"
,
" <td>Implement natural language understanding (NLU)...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>145</th>
\n
"
,
" <td>Conversational Surveys</td>
\n
"
,
" <td>Develop conversational surveys to collect feed...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>146</th>
\n
"
,
" <td>Data Privacy Impact Assessment</td>
\n
"
,
" <td>Conduct a data privacy impact assessment (DPIA...</td>
\n
"
,
" <td>High</td>
\n
"
,
" <td>1</td>
\n
"
,
" </tr>
\n
"
,
" <tr>
\n
"
,
" <th>147</th>
\n
"
,
" <td>A/B Testing Platform</td>
\n
"
,
" <td>Design and develop an A/B testing platform for...</td>
\n
"
,
" <td>Low</td>
\n
"
,
" <td>0</td>
\n
"
,
" </tr>
\n
"
,
" </tbody>
\n
"
,
"</table>
\n
"
,
"<p>148 rows × 4 columns</p>
\n
"
,
"</div>
\n
"
,
" <div class=
\"
colab-df-buttons
\"
>
\n
"
,
"
\n
"
,
" <div class=
\"
colab-df-container
\"
>
\n
"
,
" <button class=
\"
colab-df-convert
\"
onclick=
\"
convertToInteractive('df-05b5924d-8eb6-41e7-bd96-af2144ab6f3f')
\"\n
"
,
" title=
\"
Convert this dataframe to an interactive table.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
" <svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 -960 960 960
\"
>
\n
"
,
" <path d=
\"
M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z
\"
/>
\n
"
,
" </svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
" <style>
\n
"
,
" .colab-df-container {\n"
,
" display:flex;
\n
"
,
" gap: 12px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert {\n"
,
" background-color: #E8F0FE;
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: #1967D2;
\n
"
,
" height: 32px;
\n
"
,
" padding: 0 0 0 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-convert:hover {\n"
,
" background-color: #E2EBFA;
\n
"
,
" box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: #174EA6;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-buttons div {\n"
,
" margin-bottom: 4px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert {\n"
,
" background-color: #3B4455;
\n
"
,
" fill: #D2E3FC;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-convert:hover {\n"
,
" background-color: #434B5C;
\n
"
,
" box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);
\n
"
,
" filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));
\n
"
,
" fill: #FFFFFF;
\n
"
,
" }
\n
"
,
" </style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" const buttonEl =
\n
"
,
" document.querySelector('#df-05b5924d-8eb6-41e7-bd96-af2144ab6f3f button.colab-df-convert');
\n
"
,
" buttonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
"
\n
"
,
" async function convertToInteractive(key) {\n"
,
" const element = document.querySelector('#df-05b5924d-8eb6-41e7-bd96-af2144ab6f3f');
\n
"
,
" const dataTable =
\n
"
,
" await google.colab.kernel.invokeFunction('convertToInteractive',
\n
"
,
" [key], {});
\n
"
,
" if (!dataTable) return;
\n
"
,
"
\n
"
,
" const docLinkHtml = 'Like what you see? Visit the ' +
\n
"
,
" '<a target=
\"
_blank
\"
href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'
\n
"
,
" + ' to learn more about interactive tables.';
\n
"
,
" element.innerHTML = '';
\n
"
,
" dataTable['output_type'] = 'display_data';
\n
"
,
" await google.colab.output.renderOutput(dataTable, element);
\n
"
,
" const docLink = document.createElement('div');
\n
"
,
" docLink.innerHTML = docLinkHtml;
\n
"
,
" element.appendChild(docLink);
\n
"
,
" }
\n
"
,
" </script>
\n
"
,
" </div>
\n
"
,
"
\n
"
,
"
\n
"
,
"<div id=
\"
df-63938025-cce3-48cd-80a4-282bf55d5152
\"
>
\n
"
,
" <button class=
\"
colab-df-quickchart
\"
onclick=
\"
quickchart('df-63938025-cce3-48cd-80a4-282bf55d5152')
\"\n
"
,
" title=
\"
Suggest charts.
\"\n
"
,
" style=
\"
display:none;
\"
>
\n
"
,
"
\n
"
,
"<svg xmlns=
\"
http://www.w3.org/2000/svg
\"
height=
\"
24px
\"
viewBox=
\"
0 0 24 24
\"\n
"
,
" width=
\"
24px
\"
>
\n
"
,
" <g>
\n
"
,
" <path d=
\"
M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z
\"
/>
\n
"
,
" </g>
\n
"
,
"</svg>
\n
"
,
" </button>
\n
"
,
"
\n
"
,
"<style>
\n
"
,
" .colab-df-quickchart {\n"
,
" --bg-color: #E8F0FE;
\n
"
,
" --fill-color: #1967D2;
\n
"
,
" --hover-bg-color: #E2EBFA;
\n
"
,
" --hover-fill-color: #174EA6;
\n
"
,
" --disabled-fill-color: #AAA;
\n
"
,
" --disabled-bg-color: #DDD;
\n
"
,
" }
\n
"
,
"
\n
"
,
" [theme=dark] .colab-df-quickchart {\n"
,
" --bg-color: #3B4455;
\n
"
,
" --fill-color: #D2E3FC;
\n
"
,
" --hover-bg-color: #434B5C;
\n
"
,
" --hover-fill-color: #FFFFFF;
\n
"
,
" --disabled-bg-color: #3B4455;
\n
"
,
" --disabled-fill-color: #666;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart {\n"
,
" background-color: var(--bg-color);
\n
"
,
" border: none;
\n
"
,
" border-radius: 50%;
\n
"
,
" cursor: pointer;
\n
"
,
" display: none;
\n
"
,
" fill: var(--fill-color);
\n
"
,
" height: 32px;
\n
"
,
" padding: 0;
\n
"
,
" width: 32px;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart:hover {\n"
,
" background-color: var(--hover-bg-color);
\n
"
,
" box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);
\n
"
,
" fill: var(--button-hover-fill-color);
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-quickchart-complete:disabled,
\n
"
,
" .colab-df-quickchart-complete:disabled:hover {\n"
,
" background-color: var(--disabled-bg-color);
\n
"
,
" fill: var(--disabled-fill-color);
\n
"
,
" box-shadow: none;
\n
"
,
" }
\n
"
,
"
\n
"
,
" .colab-df-spinner {\n"
,
" border: 2px solid var(--fill-color);
\n
"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" animation:
\n
"
,
" spin 1s steps(1) infinite;
\n
"
,
" }
\n
"
,
"
\n
"
,
" @keyframes spin {\n"
,
" 0% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 20% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 30% {\n"
,
" border-color: transparent;
\n
"
,
" border-left-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 40% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-top-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 60% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 80% {\n"
,
" border-color: transparent;
\n
"
,
" border-right-color: var(--fill-color);
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" 90% {\n"
,
" border-color: transparent;
\n
"
,
" border-bottom-color: var(--fill-color);
\n
"
,
" }
\n
"
,
" }
\n
"
,
"</style>
\n
"
,
"
\n
"
,
" <script>
\n
"
,
" async function quickchart(key) {\n"
,
" const quickchartButtonEl =
\n
"
,
" document.querySelector('#' + key + ' button');
\n
"
,
" quickchartButtonEl.disabled = true; // To prevent multiple clicks.
\n
"
,
" quickchartButtonEl.classList.add('colab-df-spinner');
\n
"
,
" try {\n"
,
" const charts = await google.colab.kernel.invokeFunction(
\n
"
,
" 'suggestCharts', [key], {});
\n
"
,
" } catch (error) {\n"
,
" console.error('Error during call to suggestCharts:', error);
\n
"
,
" }
\n
"
,
" quickchartButtonEl.classList.remove('colab-df-spinner');
\n
"
,
" quickchartButtonEl.classList.add('colab-df-quickchart-complete');
\n
"
,
" }
\n
"
,
" (() => {\n"
,
" let quickchartButtonEl =
\n
"
,
" document.querySelector('#df-63938025-cce3-48cd-80a4-282bf55d5152 button');
\n
"
,
" quickchartButtonEl.style.display =
\n
"
,
" google.colab.kernel.accessAllowed ? 'block' : 'none';
\n
"
,
" })();
\n
"
,
" </script>
\n
"
,
"</div>
\n
"
,
" </div>
\n
"
,
" </div>
\n
"
]
},
"metadata"
:
{},
"execution_count"
:
8
}
],
"source"
:
[
"df"
]
},
{
"cell_type"
:
"code"
,
"execution_count"
:
null
,
"metadata"
:
{
"id"
:
"9XVubeEMDwJN"
},
"outputs"
:
[],
"source"
:
[
"#train test split
\n
"
,
"x_train, x_test, y_train, y_test = train_test_split(df.TaskDescription, df.high, test_size=0.2)"
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"x_train"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"XkomH8f2215K"
,
"outputId"
:
"e56869db-7caa-4fca-d370-38fa26c1f2cd"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"127 Optimize cloud costs by analyzing resource usa...
\n
"
,
"111 Design and develop an A/B testing platform for...
\n
"
,
"146 Conduct a data privacy impact assessment (DPIA...
\n
"
,
"90 Implement a speech recognition system to conve...
\n
"
,
"45 Develop an inventory management system to trac...
\n
"
,
" ...
\n
"
,
"18 Redesign the company website to make it more m...
\n
"
,
"123 Implement voice biometrics for user authentica...
\n
"
,
"129 Perform sales funnel analysis to identify bott...
\n
"
,
"3 Enhance the existing customer relationship man...
\n
"
,
"39 Develop a chatbot feature for customer support...
\n
"
,
"Name: TaskDescription, Length: 118, dtype: object"
]
},
"metadata"
:
{},
"execution_count"
:
10
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"x_train.describe()"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"hAaehk3024w2"
,
"outputId"
:
"694b3746-a488-4081-b7ae-f3290e300772"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"count 118
\n
"
,
"unique 109
\n
"
,
"top Design and implement a data lake architecture ...
\n
"
,
"freq 2
\n
"
,
"Name: TaskDescription, dtype: object"
]
},
"metadata"
:
{},
"execution_count"
:
11
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#count word occurrences and store them in a numerical matrix
\n
"
,
"cv = CountVectorizer()
\n
"
,
"x_train_count = cv.fit_transform(x_train.values) #fit the vectorizer and turn the training descriptions into a count matrix
\n
"
],
"metadata"
:
{
"id"
:
"_td_dr0s3CBN"
},
"execution_count"
:
null
,
"outputs"
:
[]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"x_train_count"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"S5ufUn1-4dpf"
,
"outputId"
:
"898b7896-84b8-4aec-843b-01fd75a40b37"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"<118x798 sparse matrix of type '<class 'numpy.int64'>'
\n
"
,
"
\t
with 2333 stored elements in Compressed Sparse Row format>"
]
},
"metadata"
:
{},
"execution_count"
:
13
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"x_train_count.toarray()"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"n5WzCLqX4h9M"
,
"outputId"
:
"a76ef34f-2172-4db1-9894-7c1e9e579337"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"array([[0, 0, 0, ..., 0, 0, 0],
\n
"
,
" [0, 0, 0, ..., 0, 0, 0],
\n
"
,
" [0, 0, 0, ..., 0, 0, 0],
\n
"
,
" ...,
\n
"
,
" [0, 0, 0, ..., 0, 0, 0],
\n
"
,
" [0, 0, 0, ..., 0, 0, 0],
\n
"
,
" [0, 0, 0, ..., 0, 0, 0]])"
]
},
"metadata"
:
{},
"execution_count"
:
14
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#train model
\n
"
,
"model = MultinomialNB()
\n
"
,
"model.fit(x_train_count, y_train) #train the model on the vectorized x_train data and the y_train labels"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
,
"height"
:
75
},
"id"
:
"OejJluIB4pO8"
,
"outputId"
:
"f7ddef8e-ff54-4716-e005-e204644b0491"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"MultinomialNB()"
],
"text/html"
:
[
"<style>#sk-container-id-1 {color: black;background-color: white;}#sk-container-id-1 pre{padding: 0;}#sk-container-id-1 div.sk-toggleable {background-color: white;}#sk-container-id-1 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-1 label.sk-toggleable__label-arrow:before {content:
\"
▸
\"
;float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-1 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-1 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-1 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-1 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-1 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-1 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content:
\"
▾
\"
;}#sk-container-id-1 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-1 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-1 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-1 div.sk-parallel-item::after {content:
\"\"
;width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-1 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-serial::before {content:
\"\"
;position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-1 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-1 div.sk-item {position: relative;z-index: 1;}#sk-container-id-1 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-1 div.sk-item::before, #sk-container-id-1 div.sk-parallel-item::before {content:
\"\"
;position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-1 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-1 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-1 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-1 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-1 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-1 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-1 div.sk-label-container {text-align: center;}#sk-container-id-1 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-1 div.sk-text-repr-fallback {display: none;}</style><div id=
\"
sk-container-id-1
\"
class=
\"
sk-top-container
\"
><div class=
\"
sk-text-repr-fallback
\"
><pre>MultinomialNB()</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=
\"
sk-container
\"
hidden><div class=
\"
sk-item
\"
><div class=
\"
sk-estimator sk-toggleable
\"
><input class=
\"
sk-toggleable__control sk-hidden--visually
\"
id=
\"
sk-estimator-id-1
\"
type=
\"
checkbox
\"
checked><label for=
\"
sk-estimator-id-1
\"
class=
\"
sk-toggleable__label sk-toggleable__label-arrow
\"
>MultinomialNB</label><div class=
\"
sk-toggleable__content
\"
><pre>MultinomialNB()</pre></div></div></div></div></div>"
]
},
"metadata"
:
{},
"execution_count"
:
15
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#validation
\n
"
,
"task1 = [
\"
Machine learning pplatform to predict Cardiac Diseases
\"
]
\n
"
,
"task1_count = cv.transform(task1) #vectorize the task text with the already-fitted CountVectorizer
\n
"
,
"model.predict(task1_count)"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"5w0z9Rt47nGS"
,
"outputId"
:
"a2b3d4aa-70dc-4ba6-a90e-7d08de4f9d34"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"array([1])"
]
},
"metadata"
:
{},
"execution_count"
:
16
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#validation
\n
"
,
"task2 = [
\"
Refactor a code
\"
]
\n
"
,
"task2_count = cv.transform(task2) #vectorize the task text with the already-fitted CountVectorizer
\n
"
,
"model.predict(task2_count)"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"bzZMZ3G58Oco"
,
"outputId"
:
"e4dbf420-4d6b-4ff8-b67a-4f406b0def0d"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"array([0])"
]
},
"metadata"
:
{},
"execution_count"
:
17
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#testing the model
\n
"
,
"x_test_count = cv.transform(x_test) #converting test data to matrix form
\n
"
,
"model.score(x_test_count, y_test) #testing against the y labels of the testing data"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"8rEHDqXF9BoP"
,
"outputId"
:
"4b28b1d8-ff18-4eea-ab00-27719e8d8439"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"0.8333333333333334"
]
},
"metadata"
:
{},
"execution_count"
:
18
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#make predictions using testing data
\n
"
,
"y_pred = model.predict(x_test_count)"
],
"metadata"
:
{
"id"
:
"qWGXwN2X9y-W"
},
"execution_count"
:
null
,
"outputs"
:
[]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"#Evaluate the performance of the classifier
\n
"
,
"print(classification_report(y_test,y_pred))"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"kPbI2biv-g-F"
,
"outputId"
:
"1920de39-9ab0-4035-8b54-25eec764d369"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
" precision recall f1-score support
\n
"
,
"
\n
"
,
" 0 0.89 0.84 0.86 19
\n
"
,
" 1 0.75 0.82 0.78 11
\n
"
,
"
\n
"
,
" accuracy 0.83 30
\n
"
,
" macro avg 0.82 0.83 0.82 30
\n
"
,
"weighted avg 0.84 0.83 0.83 30
\n
"
,
"
\n
"
]
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"# Calculate the accuracy of the model
\n
"
,
"accuracy = accuracy_score(y_test, y_pred)
\n
"
,
"print(
\"
Accuracy:
\"
, accuracy)"
],
"metadata"
:
{
"id"
:
"thbdaDaA-tsF"
,
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"outputId"
:
"f6f373c6-0057-43eb-e1f4-ddaaf1860675"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"Accuracy: 0.8333333333333334
\n
"
]
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"from sklearn.metrics import f1_score
\n
"
,
"f1 = f1_score(y_test, y_pred)
\n
"
,
"print(
\"
F1 score:
\"
, f1)"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"favBrnZWJnLt"
,
"outputId"
:
"a22dc8c6-fdab-4e8a-867a-67e8107983cf"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"F1 score: 0.7826086956521738
\n
"
]
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"from sklearn.metrics import recall_score
\n
"
,
"recall = recall_score(y_test, y_pred)
\n
"
,
"print(
\"
Recall:
\"
, recall)"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"Scr5KlNdJ5xw"
,
"outputId"
:
"cfedfba5-a751-4876-c201-0202bff54196"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"Recall: 0.8181818181818182
\n
"
]
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"from sklearn.metrics import precision_score
\n
"
,
"precision = precision_score(y_test, y_pred)
\n
"
,
"print(
\"
Precision:
\"
, precision)"
],
"metadata"
:
{
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
},
"id"
:
"5Th4pX7NKqF2"
,
"outputId"
:
"21fb8a68-6405-438e-cafc-4536b7ff4158"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"stream"
,
"name"
:
"stdout"
,
"text"
:
[
"Precision: 0.75
\n
"
]
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"from sklearn.metrics import accuracy_score,confusion_matrix
\n
"
,
"import matplotlib.pyplot as plt
\n
"
,
"import seaborn as sns"
],
"metadata"
:
{
"id"
:
"o7clj6nahd4E"
},
"execution_count"
:
null
,
"outputs"
:
[]
},
{
"cell_type"
:
"code"
,
"source"
:
[
"cm=confusion_matrix(y_test,y_pred)
\n
"
,
"fig=plt.figure(figsize=(12,8))
\n
"
,
"sns.heatmap(
\n
"
,
" cm,
\n
"
,
" annot=True,
\n
"
,
")
\n
"
,
"plt.title(
\"
Confusion Matrix for Naive Bayes Classifier
\"
)
\n
"
,
"cm"
],
"metadata"
:
{
"id"
:
"mWEuzWnZLiPN"
,
"colab"
:
{
"base_uri"
:
"https://localhost:8080/"
,
"height"
:
691
},
"outputId"
:
"4723b7fb-4caf-427c-8959-54dfe5f8d9a2"
},
"execution_count"
:
null
,
"outputs"
:
[
{
"output_type"
:
"execute_result"
,
"data"
:
{
"text/plain"
:
[
"array([[16, 3],
\n
"
,
" [ 2, 9]])"
]
},
"metadata"
:
{},
"execution_count"
:
31
},
{
"output_type"
:
"display_data"
,
"data"
:
{
"text/plain"
:
[
"<Figure size 1200x800 with 2 Axes>"
],
"image/png"
:
"
\n
"
},
"metadata"
:
{}
}
]
},
{
"cell_type"
:
"code"
,
"source"
:
[],
"metadata"
:
{
"id"
:
"DkNbZ5zbhLBc"
},
"execution_count"
:
null
,
"outputs"
:
[]
}
],
"metadata"
:
{
"colab"
:
{
"provenance"
:
[]
},
"kernelspec"
:
{
"display_name"
:
"Python 3"
,
"name"
:
"python3"
},
"language_info"
:
{
"name"
:
"python"
}
},
"nbformat"
:
4
,
"nbformat_minor"
:
0
}
\ No newline at end of file
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment