Commit 8ceb3408 authored by Anuththara18's avatar Anuththara18

clustering model files added

parent 9fb2698c
This source diff could not be displayed because it is too large. You can view the blob instead.
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>23</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1023</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>24</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1397</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>25</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>961</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>52.631579</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>26</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>804</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>42.105263</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>27</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1180</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>57.894737</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>28</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" <td>994</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>10.526316</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>29</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>448</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>15.789474</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>29</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>733</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>36.842105</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>29</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>5</td>\n",
" <td>1</td>\n",
" <td>1083</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>26.315789</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>31</th>\n",
" <td>29</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>15</td>\n",
" <td>0</td>\n",
" <td>771</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>78.947368</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>32</th>\n",
" <td>30</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>9</td>\n",
" <td>1</td>\n",
" <td>668</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>47.368421</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>33</th>\n",
" <td>31</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>17</td>\n",
" <td>9</td>\n",
" <td>2</td>\n",
" <td>838</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>47.368421</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>34</th>\n",
" <td>32</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1338</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>35</th>\n",
" <td>33</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1106</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>37</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>18</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>987</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>5.263158</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>37</th>\n",
" <td>38</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>17</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>1181</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>10.526316</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" <tr>\n",
" <th>38</th>\n",
" <td>39</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1179</td>\n",
" <td>57000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>Alternating</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"22 23 2 6 19 19 \n",
"23 24 1 6 19 19 \n",
"24 25 1 6 19 19 \n",
"25 26 1 6 19 19 \n",
"26 27 1 6 19 19 \n",
"27 28 1 6 19 18 \n",
"28 29 2 6 19 18 \n",
"29 29 2 6 19 18 \n",
"30 29 2 6 19 18 \n",
"31 29 1 7 19 19 \n",
"32 30 1 7 19 18 \n",
"33 31 1 7 19 17 \n",
"34 32 1 7 19 19 \n",
"35 33 1 7 19 19 \n",
"36 37 2 7 19 18 \n",
"37 38 2 7 19 17 \n",
"38 39 2 7 19 19 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"22 0 0 1023 57000 \n",
"23 0 0 1397 57000 \n",
"24 10 0 961 57000 \n",
"25 8 0 804 57000 \n",
"26 11 0 1180 57000 \n",
"27 2 1 994 57000 \n",
"28 3 1 448 57000 \n",
"29 7 1 733 57000 \n",
"30 5 1 1083 57000 \n",
"31 15 0 771 57000 \n",
"32 9 1 668 57000 \n",
"33 9 2 838 57000 \n",
"34 0 0 1338 57000 \n",
"35 0 0 1106 57000 \n",
"36 1 1 987 57000 \n",
"37 2 2 1181 57000 \n",
"38 0 0 1179 57000 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer \\\n",
"22 No 100.000000 0.000000 0.000000 \n",
"23 No 100.000000 0.000000 0.000000 \n",
"24 No 100.000000 0.000000 52.631579 \n",
"25 No 100.000000 0.000000 42.105263 \n",
"26 No 100.000000 0.000000 57.894737 \n",
"27 No 94.736842 5.263158 10.526316 \n",
"28 No 94.736842 5.263158 15.789474 \n",
"29 No 94.736842 5.263158 36.842105 \n",
"30 No 94.736842 5.263158 26.315789 \n",
"31 No 100.000000 0.000000 78.947368 \n",
"32 No 94.736842 5.263158 47.368421 \n",
"33 No 89.473684 10.526316 47.368421 \n",
"34 No 100.000000 0.000000 0.000000 \n",
"35 No 100.000000 0.000000 0.000000 \n",
"36 No 94.736842 5.263158 5.263158 \n",
"37 No 89.473684 10.526316 10.526316 \n",
"38 No 100.000000 0.000000 0.000000 \n",
"\n",
" game \n",
"22 Alternating \n",
"23 Alternating \n",
"24 Alternating \n",
"25 Alternating \n",
"26 Alternating \n",
"27 Alternating \n",
"28 Alternating \n",
"29 Alternating \n",
"30 Alternating \n",
"31 Alternating \n",
"32 Alternating \n",
"33 Alternating \n",
"34 Alternating \n",
"35 Alternating \n",
"36 Alternating \n",
"37 Alternating \n",
"38 Alternating "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Importing the dataset \n",
"dataset = pd.read_csv('data.csv') \n",
"\n",
"dataset.drop(dataset.index[dataset['game'] == 'Divided'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Sustained'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Selective'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Focused'], inplace = True)\n",
"\n",
"dataset.drop(dataset.index[dataset['child_age'] == 4], inplace = True)\n",
"dataset.drop(dataset.index[dataset['child_age'] == 5], inplace = True)\n",
"\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[1023. , 100. , 0. , 0. ],\n",
" [1397. , 100. , 0. , 0. ],\n",
" [ 961. , 100. , 0. , 52.63157895],\n",
" [ 804. , 100. , 0. , 42.10526316],\n",
" [1180. , 100. , 0. , 57.89473684],\n",
" [ 994. , 94.73684211, 5.26315789, 10.52631579],\n",
" [ 448. , 94.73684211, 5.26315789, 15.78947368],\n",
" [ 733. , 94.73684211, 5.26315789, 36.84210526],\n",
" [1083. , 94.73684211, 5.26315789, 26.31578947],\n",
" [ 771. , 100. , 0. , 78.94736842],\n",
" [ 668. , 94.73684211, 5.26315789, 47.36842105],\n",
" [ 838. , 89.47368421, 10.52631579, 47.36842105],\n",
" [1338. , 100. , 0. , 0. ],\n",
" [1106. , 100. , 0. , 0. ],\n",
" [ 987. , 94.73684211, 5.26315789, 5.26315789],\n",
" [1181. , 89.47368421, 10.52631579, 10.52631579],\n",
" [1179. , 100. , 0. , 0. ]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# extracting only 11-comission & 12-omission\n",
"x = dataset.iloc[:, [7, 10, 11, 12]].values \n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 0.17087754, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 1.72293381, 0.85125653, -0.85125653, -1.03606733],\n",
" [-0.08641521, 0.85125653, -0.85125653, 1.11187713],\n",
" [-0.73794686, 0.85125653, -0.85125653, 0.68228824],\n",
" [ 0.82240918, 0.85125653, -0.85125653, 1.32667158],\n",
" [ 0.05053093, -0.59587957, 0.59587957, -0.60647843],\n",
" [-2.21530524, -0.59587957, 0.59587957, -0.39168399],\n",
" [-1.03258856, -0.59587957, 0.59587957, 0.46749379],\n",
" [ 0.41987052, -0.59587957, 0.59587957, 0.0379049 ],\n",
" [-0.874893 , 0.85125653, -0.85125653, 2.18584936],\n",
" [-1.30233096, -0.59587957, 0.59587957, 0.89708268],\n",
" [-0.59685083, -2.04301567, 2.04301567, 0.89708268],\n",
" [ 1.47809071, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 0.51531784, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 0.02148175, -0.59587957, 0.59587957, -0.82127288],\n",
" [ 0.82655907, -2.04301567, 2.04301567, -0.60647843],\n",
" [ 0.8182593 , 0.85125653, -0.85125653, -1.03606733]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# standardizing the data\n",
"from sklearn.preprocessing import StandardScaler\n",
"scaler = StandardScaler()\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# statistics of scaled data\n",
"pd.DataFrame(new_df).describe()\n",
"\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "b5fc4f60",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 6. , 0.17087754, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 6. , 1.72293381, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 6. , -0.08641521, 0.85125653, -0.85125653, 1.11187713],\n",
" [ 6. , -0.73794686, 0.85125653, -0.85125653, 0.68228824],\n",
" [ 6. , 0.82240918, 0.85125653, -0.85125653, 1.32667158],\n",
" [ 6. , 0.05053093, -0.59587957, 0.59587957, -0.60647843],\n",
" [ 6. , -2.21530524, -0.59587957, 0.59587957, -0.39168399],\n",
" [ 6. , -1.03258856, -0.59587957, 0.59587957, 0.46749379],\n",
" [ 6. , 0.41987052, -0.59587957, 0.59587957, 0.0379049 ],\n",
" [ 7. , -0.874893 , 0.85125653, -0.85125653, 2.18584936],\n",
" [ 7. , -1.30233096, -0.59587957, 0.59587957, 0.89708268],\n",
" [ 7. , -0.59685083, -2.04301567, 2.04301567, 0.89708268],\n",
" [ 7. , 1.47809071, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 7. , 0.51531784, 0.85125653, -0.85125653, -1.03606733],\n",
" [ 7. , 0.02148175, -0.59587957, 0.59587957, -0.82127288],\n",
" [ 7. , 0.82655907, -2.04301567, 2.04301567, -0.60647843],\n",
" [ 7. , 0.8182593 , 0.85125653, -0.85125653, -1.03606733]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"x = dataset.iloc[:, [2, 7, 10, 11, 12]].copy()\n",
"x[['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer', 'cer']] = new_df\n",
"x.head()\n",
"x = x.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "58284e31",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Finding the optimal number of clusters using the elbow method\n",
"from sklearn.cluster import KMeans \n",
"wcss_list= [] #Initializing the list for the values of WCSS \n",
" \n",
"#Using for loop for iterations from 1 to 10. \n",
"for i in range(1, 11): \n",
" kmeans = KMeans(n_clusters=i, init='k-means++', random_state= 42) \n",
" kmeans.fit(x) \n",
" wcss_list.append(kmeans.inertia_) \n",
"mtp.plot(range(1, 11), wcss_list) \n",
"mtp.title('The Elobw Method Graph') \n",
"mtp.xlabel('Number of clusters(k)') \n",
"mtp.ylabel('wcss_list') \n",
"mtp.show()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "5d1c61bf",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[1 1 2 2 2 0 0 0 0 2 0 0 1 1 0 0 1]\n"
]
}
],
"source": [
"#training the K-means model on a dataset \n",
"kmeans = KMeans(n_clusters = 3, init='k-means++', random_state= 42) \n",
"y_predict= kmeans.fit_predict(x) \n",
"print(y_predict)\n"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "984e35be",
"metadata": {},
"outputs": [],
"source": [
"# save the model to disk\n",
"import pickle\n",
"filename = 'modelaa2.sav'\n",
"pickle.dump(kmeans, open(filename, 'wb'))"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>6</td>\n",
" <td>1023</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>6</td>\n",
" <td>1397</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>6</td>\n",
" <td>961</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>52.631579</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>6</td>\n",
" <td>804</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>42.105263</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>6</td>\n",
" <td>1180</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>57.894737</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>6</td>\n",
" <td>994</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>10.526316</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>6</td>\n",
" <td>448</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>15.789474</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>6</td>\n",
" <td>733</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>36.842105</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>6</td>\n",
" <td>1083</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>26.315789</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>31</th>\n",
" <td>7</td>\n",
" <td>771</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>78.947368</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>32</th>\n",
" <td>7</td>\n",
" <td>668</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>47.368421</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>33</th>\n",
" <td>7</td>\n",
" <td>838</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>47.368421</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>34</th>\n",
" <td>7</td>\n",
" <td>1338</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>35</th>\n",
" <td>7</td>\n",
" <td>1106</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>7</td>\n",
" <td>987</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>5.263158</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>37</th>\n",
" <td>7</td>\n",
" <td>1181</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>10.526316</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>38</th>\n",
" <td>7</td>\n",
" <td>1179</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"22 6 1023 100.000000 \n",
"23 6 1397 100.000000 \n",
"24 6 961 100.000000 \n",
"25 6 804 100.000000 \n",
"26 6 1180 100.000000 \n",
"27 6 994 94.736842 \n",
"28 6 448 94.736842 \n",
"29 6 733 94.736842 \n",
"30 6 1083 94.736842 \n",
"31 7 771 100.000000 \n",
"32 7 668 94.736842 \n",
"33 7 838 89.473684 \n",
"34 7 1338 100.000000 \n",
"35 7 1106 100.000000 \n",
"36 7 987 94.736842 \n",
"37 7 1181 89.473684 \n",
"38 7 1179 100.000000 \n",
"\n",
" oer cer clusters \n",
"22 0.000000 0.000000 1 \n",
"23 0.000000 0.000000 1 \n",
"24 0.000000 52.631579 2 \n",
"25 0.000000 42.105263 2 \n",
"26 0.000000 57.894737 2 \n",
"27 5.263158 10.526316 0 \n",
"28 5.263158 15.789474 0 \n",
"29 5.263158 36.842105 0 \n",
"30 5.263158 26.315789 0 \n",
"31 0.000000 78.947368 2 \n",
"32 5.263158 47.368421 0 \n",
"33 10.526316 47.368421 0 \n",
"34 0.000000 0.000000 1 \n",
"35 0.000000 0.000000 1 \n",
"36 5.263158 5.263158 0 \n",
"37 10.526316 10.526316 0 \n",
"38 0.000000 0.000000 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"new_df = dataset.iloc[:, [2, 7, 10, 11, 12]].copy()\n",
"new_df['clusters'] = y_predict\n",
"new_df.head()\n",
"display(new_df)"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "ba8fef3b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"8"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 0])"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "6c5b7397",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>6</td>\n",
" <td>994</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>10.526316</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>6</td>\n",
" <td>448</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>15.789474</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>6</td>\n",
" <td>733</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>36.842105</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>6</td>\n",
" <td>1083</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>26.315789</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>32</th>\n",
" <td>7</td>\n",
" <td>668</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>47.368421</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>33</th>\n",
" <td>7</td>\n",
" <td>838</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>47.368421</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>7</td>\n",
" <td>987</td>\n",
" <td>94.736842</td>\n",
" <td>5.263158</td>\n",
" <td>5.263158</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>37</th>\n",
" <td>7</td>\n",
" <td>1181</td>\n",
" <td>89.473684</td>\n",
" <td>10.526316</td>\n",
" <td>10.526316</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"27 6 994 94.736842 \n",
"28 6 448 94.736842 \n",
"29 6 733 94.736842 \n",
"30 6 1083 94.736842 \n",
"32 7 668 94.736842 \n",
"33 7 838 89.473684 \n",
"36 7 987 94.736842 \n",
"37 7 1181 89.473684 \n",
"\n",
" oer cer clusters \n",
"27 5.263158 10.526316 0 \n",
"28 5.263158 15.789474 0 \n",
"29 5.263158 36.842105 0 \n",
"30 5.263158 26.315789 0 \n",
"32 5.263158 47.368421 0 \n",
"33 10.526316 47.368421 0 \n",
"36 5.263158 5.263158 0 \n",
"37 10.526316 10.526316 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"display(cluster_0)\n",
"# cluster_0.boxplot(column =['CER'], grid = False)\n",
"# cluster_0.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "849d9447",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 448\n",
"mean_reaction_time max - 1181\n",
"\n",
"percentage_no_of_correct_responses min - 89.47368421\n",
"percentage_no_of_correct_responses max - 94.73684211\n",
"\n",
"oer min - 5.263157895\n",
"oer max - 10.52631579\n",
"\n",
"cer min - 5.263157895\n",
"cer max - 47.36842105\n"
]
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"\n",
"maxVal = cluster_0['mean_reaction_time'].max()\n",
"minVal = cluster_0['mean_reaction_time'].min()\n",
"\n",
"print(\"mean_reaction_time min - \", minVal)\n",
"print(\"mean_reaction_time max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_0['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['oer'].max()\n",
"minVal = cluster_0['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['cer'].max()\n",
"minVal = cluster_0['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "f9ed816e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"5"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 1])"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "e3eeb500",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>6</td>\n",
" <td>1023</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>6</td>\n",
" <td>1397</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>34</th>\n",
" <td>7</td>\n",
" <td>1338</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>35</th>\n",
" <td>7</td>\n",
" <td>1106</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>38</th>\n",
" <td>7</td>\n",
" <td>1179</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"22 6 1023 100.0 0.0 \n",
"23 6 1397 100.0 0.0 \n",
"34 7 1338 100.0 0.0 \n",
"35 7 1106 100.0 0.0 \n",
"38 7 1179 100.0 0.0 \n",
"\n",
" cer clusters \n",
"22 0.0 1 \n",
"23 0.0 1 \n",
"34 0.0 1 \n",
"35 0.0 1 \n",
"38 0.0 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"display(cluster_1)\n",
"#cluster_1.boxplot(column =['CER'], grid = False)\n",
"#cluster_1.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "2ab1bc45",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 1023\n",
"mean_reaction_time max - 1397\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n",
"\n",
"cer min - 0.0\n",
"cer max - 0.0\n"
]
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"\n",
"maxVal = cluster_1['mean_reaction_time'].max()\n",
"minVal = cluster_1['mean_reaction_time'].min()\n",
"\n",
"print(\"mean_reaction_time min - \", minVal)\n",
"print(\"mean_reaction_time max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_1['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['oer'].max()\n",
"minVal = cluster_1['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"\n",
"print()\n",
"\n",
"maxVal = cluster_1['cer'].max()\n",
"minVal = cluster_1['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "e62b9a30",
"metadata": {},
"source": [
"## Cluster 3"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "105ff3ad",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"4"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 2])"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "9c9ac4a6",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>6</td>\n",
" <td>961</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>52.631579</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>6</td>\n",
" <td>804</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>42.105263</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>6</td>\n",
" <td>1180</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>57.894737</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>31</th>\n",
" <td>7</td>\n",
" <td>771</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>78.947368</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"24 6 961 100.0 0.0 \n",
"25 6 804 100.0 0.0 \n",
"26 6 1180 100.0 0.0 \n",
"31 7 771 100.0 0.0 \n",
"\n",
" cer clusters \n",
"24 52.631579 2 \n",
"25 42.105263 2 \n",
"26 57.894737 2 \n",
"31 78.947368 2 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_2 = new_df[new_df[\"clusters\"] == 2 ]\n",
"display(cluster_2)\n",
"#cluster_2.boxplot(column =['CER'], grid = False)\n",
"#cluster_2.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "09b1596d",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 771\n",
"mean_reaction_time max - 1180\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n",
"\n",
"cer min - 42.10526316\n",
"cer max - 78.94736842\n"
]
}
],
"source": [
"# Print the smallest and largest value of each feature among the rows labelled cluster 2.\n",
"cluster_2 = new_df[new_df[\"clusters\"] == 2]\n",
"\n",
"summary_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer', 'cer']\n",
"\n",
"for position, column in enumerate(summary_columns):\n",
"    if position:\n",
"        print()  # blank line between consecutive features, none after the last\n",
"    minVal, maxVal = cluster_2[column].min(), cluster_2[column].max()\n",
"    print(f\"{column} min - \", minVal)\n",
"    print(f\"{column} max - \", maxVal)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "37d3d977",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"id": "796872b0",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>39</th>\n",
" <td>40</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>3</td>\n",
" <td>3</td>\n",
" <td>1303</td>\n",
" <td>70000</td>\n",
" <td>Yes</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>40</th>\n",
" <td>41</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>2</td>\n",
" <td>3</td>\n",
" <td>1384</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>41</th>\n",
" <td>42</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>1</td>\n",
" <td>1191</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>42</th>\n",
" <td>43</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>4</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>1335</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>50.0</td>\n",
" <td>50.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>43</th>\n",
" <td>44</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>6</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>1253</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>44</th>\n",
" <td>45</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>1239</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>45</th>\n",
" <td>46</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>1</td>\n",
" <td>1109</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>46</th>\n",
" <td>47</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>952</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>47</th>\n",
" <td>48</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>928</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>48</th>\n",
" <td>49</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>1428</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>49</th>\n",
" <td>50</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>1115</td>\n",
" <td>70000</td>\n",
" <td>No</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>75.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50</th>\n",
" <td>51</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>1157</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>51</th>\n",
" <td>52</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>2</td>\n",
" <td>1097</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>52</th>\n",
" <td>53</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1160</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>53</th>\n",
" <td>54</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1053</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>54</th>\n",
" <td>55</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>953</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>55</th>\n",
" <td>56</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>2</td>\n",
" <td>1303</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>56</th>\n",
" <td>57</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>3</td>\n",
" <td>6</td>\n",
" <td>5</td>\n",
" <td>1257</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>37.5</td>\n",
" <td>62.5</td>\n",
" <td>75.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>57</th>\n",
" <td>58</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1008</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>58</th>\n",
" <td>59</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>8</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>7</td>\n",
" <td>1188</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>12.5</td>\n",
" <td>87.5</td>\n",
" <td>87.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>59</th>\n",
" <td>60</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>670</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>60</th>\n",
" <td>61</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>1</td>\n",
" <td>614</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>61</th>\n",
" <td>62</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>778</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>62</th>\n",
" <td>63</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>778</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>63</th>\n",
" <td>64</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>4</td>\n",
" <td>3</td>\n",
" <td>832</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>50.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>64</th>\n",
" <td>65</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1173</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>65</th>\n",
" <td>66</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1007</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>66</th>\n",
" <td>67</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1025</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>67</th>\n",
" <td>68</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>1012</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>68</th>\n",
" <td>69</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>5</td>\n",
" <td>1</td>\n",
" <td>845</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>62.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>69</th>\n",
" <td>70</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>850</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>70</th>\n",
" <td>71</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>586</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>71</th>\n",
" <td>72</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" <td>845</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>25.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>72</th>\n",
" <td>73</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1033</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>73</th>\n",
" <td>74</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>867</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>74</th>\n",
" <td>75</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>2</td>\n",
" <td>901</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75</th>\n",
" <td>76</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>7</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>955</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>76</th>\n",
" <td>77</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>780</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77</th>\n",
" <td>78</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>694</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" <tr>\n",
" <th>78</th>\n",
" <td>79</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>719</td>\n",
" <td>60000</td>\n",
" <td>No</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>0.0</td>\n",
" <td>Divided</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"39 40 2 4 8 5 \n",
"40 41 1 4 8 5 \n",
"41 42 2 4 8 7 \n",
"42 43 2 4 8 4 \n",
"43 44 1 4 8 6 \n",
"44 45 1 4 8 8 \n",
"45 46 1 4 8 7 \n",
"46 47 1 4 8 8 \n",
"47 48 1 4 8 8 \n",
"48 49 1 4 8 7 \n",
"49 50 1 4 8 5 \n",
"50 51 2 5 8 8 \n",
"51 52 2 5 8 6 \n",
"52 53 2 5 8 8 \n",
"53 54 2 5 8 7 \n",
"54 55 2 5 8 7 \n",
"55 56 2 5 8 6 \n",
"56 57 2 5 8 3 \n",
"57 58 1 5 8 8 \n",
"58 59 1 5 8 1 \n",
"59 60 2 6 8 7 \n",
"60 61 2 6 8 7 \n",
"61 62 2 6 8 8 \n",
"62 63 2 6 8 8 \n",
"63 64 2 6 8 5 \n",
"64 65 1 6 8 7 \n",
"65 66 1 6 8 7 \n",
"66 67 1 6 8 7 \n",
"67 68 1 6 8 7 \n",
"68 69 1 6 8 7 \n",
"69 70 1 7 8 8 \n",
"70 71 1 7 8 6 \n",
"71 72 1 7 8 7 \n",
"72 73 1 7 8 8 \n",
"73 74 1 7 8 7 \n",
"74 75 1 7 8 6 \n",
"75 76 2 7 8 7 \n",
"76 77 2 7 8 8 \n",
"77 78 2 7 8 8 \n",
"78 79 2 7 8 5 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"39 3 3 1303 70000 \n",
"40 2 3 1384 70000 \n",
"41 4 1 1191 70000 \n",
"42 2 4 1335 70000 \n",
"43 2 2 1253 70000 \n",
"44 2 0 1239 70000 \n",
"45 4 1 1109 70000 \n",
"46 2 0 952 70000 \n",
"47 0 0 928 70000 \n",
"48 3 1 1428 70000 \n",
"49 6 3 1115 70000 \n",
"50 2 0 1157 60000 \n",
"51 3 2 1097 60000 \n",
"52 0 0 1160 60000 \n",
"53 1 1 1053 60000 \n",
"54 0 1 953 60000 \n",
"55 3 2 1303 60000 \n",
"56 6 5 1257 60000 \n",
"57 0 0 1008 60000 \n",
"58 7 7 1188 60000 \n",
"59 1 1 670 60000 \n",
"60 4 1 614 60000 \n",
"61 2 0 778 60000 \n",
"62 1 0 778 60000 \n",
"63 4 3 832 60000 \n",
"64 1 1 1173 60000 \n",
"65 1 1 1007 60000 \n",
"66 1 1 1025 60000 \n",
"67 3 1 1012 60000 \n",
"68 5 1 845 60000 \n",
"69 3 0 850 60000 \n",
"70 0 2 586 60000 \n",
"71 2 1 845 60000 \n",
"72 0 0 1033 60000 \n",
"73 1 1 867 60000 \n",
"74 3 2 901 60000 \n",
"75 1 1 955 60000 \n",
"76 1 0 780 60000 \n",
"77 1 0 694 60000 \n",
"78 0 3 719 60000 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer game \n",
"39 Yes 62.5 37.5 37.5 Divided \n",
"40 No 62.5 37.5 25.0 Divided \n",
"41 No 87.5 12.5 50.0 Divided \n",
"42 No 50.0 50.0 25.0 Divided \n",
"43 No 75.0 25.0 25.0 Divided \n",
"44 No 100.0 0.0 25.0 Divided \n",
"45 No 87.5 12.5 50.0 Divided \n",
"46 No 100.0 0.0 25.0 Divided \n",
"47 No 100.0 0.0 0.0 Divided \n",
"48 No 87.5 12.5 37.5 Divided \n",
"49 No 62.5 37.5 75.0 Divided \n",
"50 No 100.0 0.0 25.0 Divided \n",
"51 No 75.0 25.0 37.5 Divided \n",
"52 No 100.0 0.0 0.0 Divided \n",
"53 No 87.5 12.5 12.5 Divided \n",
"54 No 87.5 12.5 0.0 Divided \n",
"55 No 75.0 25.0 37.5 Divided \n",
"56 No 37.5 62.5 75.0 Divided \n",
"57 No 100.0 0.0 0.0 Divided \n",
"58 No 12.5 87.5 87.5 Divided \n",
"59 No 87.5 12.5 12.5 Divided \n",
"60 No 87.5 12.5 50.0 Divided \n",
"61 No 100.0 0.0 25.0 Divided \n",
"62 No 100.0 0.0 12.5 Divided \n",
"63 No 62.5 37.5 50.0 Divided \n",
"64 No 87.5 12.5 12.5 Divided \n",
"65 No 87.5 12.5 12.5 Divided \n",
"66 No 87.5 12.5 12.5 Divided \n",
"67 No 87.5 12.5 37.5 Divided \n",
"68 No 87.5 12.5 62.5 Divided \n",
"69 No 100.0 0.0 37.5 Divided \n",
"70 No 75.0 25.0 0.0 Divided \n",
"71 No 87.5 12.5 25.0 Divided \n",
"72 No 100.0 0.0 0.0 Divided \n",
"73 No 87.5 12.5 12.5 Divided \n",
"74 No 75.0 25.0 37.5 Divided \n",
"75 No 87.5 12.5 12.5 Divided \n",
"76 No 100.0 0.0 12.5 Divided \n",
"77 No 100.0 0.0 12.5 Divided \n",
"78 No 62.5 37.5 0.0 Divided "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Read the raw records and discard every row that belongs to one of the four excluded games.\n",
"excluded_games = ['Alternating', 'Sustained', 'Selective', 'Focused']\n",
"dataset = pd.read_csv('data.csv')\n",
"is_excluded = dataset['game'].isin(excluded_games)\n",
"dataset = dataset.loc[~is_excluded].copy()  # original row labels are kept, as with drop()\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[1303. , 62.5, 37.5, 37.5],\n",
" [1384. , 62.5, 37.5, 25. ],\n",
" [1191. , 87.5, 12.5, 50. ],\n",
" [1335. , 50. , 50. , 25. ],\n",
" [1253. , 75. , 25. , 25. ],\n",
" [1239. , 100. , 0. , 25. ],\n",
" [1109. , 87.5, 12.5, 50. ],\n",
" [ 952. , 100. , 0. , 25. ],\n",
" [ 928. , 100. , 0. , 0. ],\n",
" [1428. , 87.5, 12.5, 37.5],\n",
" [1115. , 62.5, 37.5, 75. ],\n",
" [1157. , 100. , 0. , 25. ],\n",
" [1097. , 75. , 25. , 37.5],\n",
" [1160. , 100. , 0. , 0. ],\n",
" [1053. , 87.5, 12.5, 12.5],\n",
" [ 953. , 87.5, 12.5, 0. ],\n",
" [1303. , 75. , 25. , 37.5],\n",
" [1257. , 37.5, 62.5, 75. ],\n",
" [1008. , 100. , 0. , 0. ],\n",
" [1188. , 12.5, 87.5, 87.5],\n",
" [ 670. , 87.5, 12.5, 12.5],\n",
" [ 614. , 87.5, 12.5, 50. ],\n",
" [ 778. , 100. , 0. , 25. ],\n",
" [ 778. , 100. , 0. , 12.5],\n",
" [ 832. , 62.5, 37.5, 50. ],\n",
" [1173. , 87.5, 12.5, 12.5],\n",
" [1007. , 87.5, 12.5, 12.5],\n",
" [1025. , 87.5, 12.5, 12.5],\n",
" [1012. , 87.5, 12.5, 37.5],\n",
" [ 845. , 87.5, 12.5, 62.5],\n",
" [ 850. , 100. , 0. , 37.5],\n",
" [ 586. , 75. , 25. , 0. ],\n",
" [ 845. , 87.5, 12.5, 25. ],\n",
" [1033. , 100. , 0. , 0. ],\n",
" [ 867. , 87.5, 12.5, 12.5],\n",
" [ 901. , 75. , 25. , 37.5],\n",
" [ 955. , 87.5, 12.5, 12.5],\n",
" [ 780. , 100. , 0. , 12.5],\n",
" [ 694. , 100. , 0. , 12.5],\n",
" [ 719. , 62.5, 37.5, 0. ]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Feature matrix by column position: 7 = mean_reaction_time,\n",
"# 10 = percentage_no_of_correct_responses, 11 = oer, 12 = cer\n",
"feature_positions = [7, 10, 11, 12]\n",
"x = dataset.iloc[:, feature_positions].to_numpy()\n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 1.35119909, -1.05730976, 1.05730976, 0.46525043],\n",
" [ 1.72400715, -1.05730976, 1.05730976, -0.09868948],\n",
" [ 0.8357114 , 0.26432744, -0.26432744, 1.02919034],\n",
" [ 1.49848129, -1.71812836, 1.71812836, -0.09868948],\n",
" [ 1.12107066, -0.39649116, 0.39649116, -0.09868948],\n",
" [ 1.0566347 , 0.92514604, -0.92514604, -0.09868948],\n",
" [ 0.45830077, 0.26432744, -0.26432744, 1.02919034],\n",
" [-0.2643025 , 0.92514604, -0.92514604, -0.09868948],\n",
" [-0.37476415, 0.92514604, -0.92514604, -1.22656931],\n",
" [ 1.92652017, 0.26432744, -0.26432744, 0.46525043],\n",
" [ 0.48591619, -1.05730976, 1.05730976, 2.15707017],\n",
" [ 0.67922407, 0.92514604, -0.92514604, -0.09868948],\n",
" [ 0.40306995, -0.39649116, 0.39649116, 0.46525043],\n",
" [ 0.69303177, 0.92514604, -0.92514604, -1.22656931],\n",
" [ 0.20055693, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [-0.25969994, 0.26432744, -0.26432744, -1.22656931],\n",
" [ 1.35119909, -0.39649116, 0.39649116, 0.46525043],\n",
" [ 1.13948093, -2.37894696, 2.37894696, 2.15707017],\n",
" [-0.00655866, 0.92514604, -0.92514604, -1.22656931],\n",
" [ 0.8219037 , -3.70058416, 3.70058416, 2.72101008],\n",
" [-1.56222686, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [-1.81997071, 0.26432744, -0.26432744, 1.02919034],\n",
" [-1.06514945, 0.92514604, -0.92514604, -0.09868948],\n",
" [-1.06514945, 0.92514604, -0.92514604, -0.6626294 ],\n",
" [-0.81661074, -1.05730976, 1.05730976, 1.02919034],\n",
" [ 0.75286517, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [-0.01116123, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [ 0.07168501, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [ 0.01185161, 0.26432744, -0.26432744, 0.46525043],\n",
" [-0.75677735, 0.26432744, -0.26432744, 1.59313025],\n",
" [-0.73376451, 0.92514604, -0.92514604, 0.46525043],\n",
" [-1.94884263, -0.39649116, 0.39649116, -1.22656931],\n",
" [-0.75677735, 0.26432744, -0.26432744, -0.09868948],\n",
" [ 0.10850556, 0.92514604, -0.92514604, -1.22656931],\n",
" [-0.65552084, 0.26432744, -0.26432744, -0.6626294 ],\n",
" [-0.49903351, -0.39649116, 0.39649116, 0.46525043],\n",
" [-0.2504948 , 0.26432744, -0.26432744, -0.6626294 ],\n",
" [-1.05594431, 0.92514604, -0.92514604, -0.6626294 ],\n",
" [-1.45176522, 0.92514604, -0.92514604, -0.6626294 ],\n",
" [-1.336701 , -1.05730976, 1.05730976, -1.22656931]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Standardise each feature column of x (StandardScaler defaults: zero mean, unit variance).\n",
"from sklearn.preprocessing import StandardScaler\n",
"\n",
"scaler = StandardScaler()\n",
"# NumPy array despite the name; a later cell assigns it back into the feature frame.\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# Summary statistics of the scaled data. A bare expression is rendered only when it is\n",
"# the last line of a cell, so the table has to be displayed explicitly.\n",
"display(pd.DataFrame(new_df).describe())\n",
"\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "b5fc4f60",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 4.00000000e+00, 1.35119909e+00, -1.05730976e+00,\n",
" 1.05730976e+00, 4.65250428e-01],\n",
" [ 4.00000000e+00, 1.72400715e+00, -1.05730976e+00,\n",
" 1.05730976e+00, -9.86894847e-02],\n",
" [ 4.00000000e+00, 8.35711402e-01, 2.64327440e-01,\n",
" -2.64327440e-01, 1.02919034e+00],\n",
" [ 4.00000000e+00, 1.49848129e+00, -1.71812836e+00,\n",
" 1.71812836e+00, -9.86894847e-02],\n",
" [ 4.00000000e+00, 1.12107066e+00, -3.96491160e-01,\n",
" 3.96491160e-01, -9.86894847e-02],\n",
" [ 4.00000000e+00, 1.05663470e+00, 9.25146041e-01,\n",
" -9.25146041e-01, -9.86894847e-02],\n",
" [ 4.00000000e+00, 4.58300773e-01, 2.64327440e-01,\n",
" -2.64327440e-01, 1.02919034e+00],\n",
" [ 4.00000000e+00, -2.64302505e-01, 9.25146041e-01,\n",
" -9.25146041e-01, -9.86894847e-02],\n",
" [ 4.00000000e+00, -3.74764152e-01, 9.25146041e-01,\n",
" -9.25146041e-01, -1.22656931e+00],\n",
" [ 4.00000000e+00, 1.92652017e+00, 2.64327440e-01,\n",
" -2.64327440e-01, 4.65250428e-01],\n",
" [ 4.00000000e+00, 4.85916185e-01, -1.05730976e+00,\n",
" 1.05730976e+00, 2.15707017e+00],\n",
" [ 5.00000000e+00, 6.79224068e-01, 9.25146041e-01,\n",
" -9.25146041e-01, -9.86894847e-02],\n",
" [ 5.00000000e+00, 4.03069949e-01, -3.96491160e-01,\n",
" 3.96491160e-01, 4.65250428e-01],\n",
" [ 5.00000000e+00, 6.93031774e-01, 9.25146041e-01,\n",
" -9.25146041e-01, -1.22656931e+00],\n",
" [ 5.00000000e+00, 2.00556929e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 5.00000000e+00, -2.59699936e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -1.22656931e+00],\n",
" [ 5.00000000e+00, 1.35119909e+00, -3.96491160e-01,\n",
" 3.96491160e-01, 4.65250428e-01],\n",
" [ 5.00000000e+00, 1.13948093e+00, -2.37894696e+00,\n",
" 2.37894696e+00, 2.15707017e+00],\n",
" [ 5.00000000e+00, -6.55866032e-03, 9.25146041e-01,\n",
" -9.25146041e-01, -1.22656931e+00],\n",
" [ 5.00000000e+00, 8.21903696e-01, -3.70058416e+00,\n",
" 3.70058416e+00, 2.72101008e+00],\n",
" [ 6.00000000e+00, -1.56222686e+00, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 6.00000000e+00, -1.81997071e+00, 2.64327440e-01,\n",
" -2.64327440e-01, 1.02919034e+00],\n",
" [ 6.00000000e+00, -1.06514945e+00, 9.25146041e-01,\n",
" -9.25146041e-01, -9.86894847e-02],\n",
" [ 6.00000000e+00, -1.06514945e+00, 9.25146041e-01,\n",
" -9.25146041e-01, -6.62629397e-01],\n",
" [ 6.00000000e+00, -8.16610742e-01, -1.05730976e+00,\n",
" 1.05730976e+00, 1.02919034e+00],\n",
" [ 6.00000000e+00, 7.52865167e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 6.00000000e+00, -1.11612290e-02, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 6.00000000e+00, 7.16850067e-02, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 6.00000000e+00, 1.18516143e-02, 2.64327440e-01,\n",
" -2.64327440e-01, 4.65250428e-01],\n",
" [ 6.00000000e+00, -7.56777350e-01, 2.64327440e-01,\n",
" -2.64327440e-01, 1.59313025e+00],\n",
" [ 7.00000000e+00, -7.33764507e-01, 9.25146041e-01,\n",
" -9.25146041e-01, 4.65250428e-01],\n",
" [ 7.00000000e+00, -1.94884263e+00, -3.96491160e-01,\n",
" 3.96491160e-01, -1.22656931e+00],\n",
" [ 7.00000000e+00, -7.56777350e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -9.86894847e-02],\n",
" [ 7.00000000e+00, 1.08505556e-01, 9.25146041e-01,\n",
" -9.25146041e-01, -1.22656931e+00],\n",
" [ 7.00000000e+00, -6.55520840e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 7.00000000e+00, -4.99033506e-01, -3.96491160e-01,\n",
" 3.96491160e-01, 4.65250428e-01],\n",
" [ 7.00000000e+00, -2.50494799e-01, 2.64327440e-01,\n",
" -2.64327440e-01, -6.62629397e-01],\n",
" [ 7.00000000e+00, -1.05594431e+00, 9.25146041e-01,\n",
" -9.25146041e-01, -6.62629397e-01],\n",
" [ 7.00000000e+00, -1.45176522e+00, 9.25146041e-01,\n",
" -9.25146041e-01, -6.62629397e-01],\n",
" [ 7.00000000e+00, -1.33670100e+00, -1.05730976e+00,\n",
" 1.05730976e+00, -1.22656931e+00]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Clustering input: raw child_age (column 2) followed by the four standardised features.\n",
"scaled_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer', 'cer']\n",
"feature_frame = dataset.iloc[:, [2, 7, 10, 11, 12]].copy()\n",
"feature_frame[scaled_columns] = new_df  # overwrite the raw values with their scaled versions\n",
"x = feature_frame.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "58284e31",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Elbow method: fit k-means for k = 1..10 and plot the within-cluster sum of squares (WCSS).\n",
"from sklearn.cluster import KMeans\n",
"\n",
"wcss_list = []  # one inertia value per candidate k\n",
"\n",
"for i in range(1, 11):\n",
"    # n_init is stated explicitly: scikit-learn changed its default from 10 to 'auto',\n",
"    # so pinning it keeps the curve the same across library versions.\n",
"    kmeans = KMeans(n_clusters=i, init='k-means++', n_init=10, random_state=42)\n",
"    kmeans.fit(x)\n",
"    wcss_list.append(kmeans.inertia_)\n",
"\n",
"mtp.plot(range(1, 11), wcss_list)\n",
"mtp.title('The Elbow Method Graph')\n",
"mtp.xlabel('Number of clusters(k)')\n",
"mtp.ylabel('wcss_list')\n",
"mtp.show()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "5d1c61bf",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.cluster import Birch\n",
"\n",
"# Create the 4-cluster BIRCH model and fit it on the feature matrix in one step\n",
"# (fit() returns the fitted estimator).\n",
"model = Birch(threshold=0.01, n_clusters=4).fit(x)\n",
"\n",
"# Cluster label for every row of x, then the distinct labels that occur.\n",
"yhat = model.predict(x)\n",
"clusters = unique(yhat)\n"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>39</th>\n",
" <td>4</td>\n",
" <td>1303</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>37.5</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>40</th>\n",
" <td>4</td>\n",
" <td>1384</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>25.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>41</th>\n",
" <td>4</td>\n",
" <td>1191</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>42</th>\n",
" <td>4</td>\n",
" <td>1335</td>\n",
" <td>50.0</td>\n",
" <td>50.0</td>\n",
" <td>25.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>43</th>\n",
" <td>4</td>\n",
" <td>1253</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>25.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>44</th>\n",
" <td>4</td>\n",
" <td>1239</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>45</th>\n",
" <td>4</td>\n",
" <td>1109</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>46</th>\n",
" <td>4</td>\n",
" <td>952</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>47</th>\n",
" <td>4</td>\n",
" <td>928</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>48</th>\n",
" <td>4</td>\n",
" <td>1428</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>37.5</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>49</th>\n",
" <td>4</td>\n",
" <td>1115</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>75.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50</th>\n",
" <td>5</td>\n",
" <td>1157</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>51</th>\n",
" <td>5</td>\n",
" <td>1097</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>52</th>\n",
" <td>5</td>\n",
" <td>1160</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>53</th>\n",
" <td>5</td>\n",
" <td>1053</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>54</th>\n",
" <td>5</td>\n",
" <td>953</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>0.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>55</th>\n",
" <td>5</td>\n",
" <td>1303</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>56</th>\n",
" <td>5</td>\n",
" <td>1257</td>\n",
" <td>37.5</td>\n",
" <td>62.5</td>\n",
" <td>75.0</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>57</th>\n",
" <td>5</td>\n",
" <td>1008</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>58</th>\n",
" <td>5</td>\n",
" <td>1188</td>\n",
" <td>12.5</td>\n",
" <td>87.5</td>\n",
" <td>87.5</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>59</th>\n",
" <td>6</td>\n",
" <td>670</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>60</th>\n",
" <td>6</td>\n",
" <td>614</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>50.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>61</th>\n",
" <td>6</td>\n",
" <td>778</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>25.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>62</th>\n",
" <td>6</td>\n",
" <td>778</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>63</th>\n",
" <td>6</td>\n",
" <td>832</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>50.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>64</th>\n",
" <td>6</td>\n",
" <td>1173</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>65</th>\n",
" <td>6</td>\n",
" <td>1007</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>66</th>\n",
" <td>6</td>\n",
" <td>1025</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>67</th>\n",
" <td>6</td>\n",
" <td>1012</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>37.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>68</th>\n",
" <td>6</td>\n",
" <td>845</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>62.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>69</th>\n",
" <td>7</td>\n",
" <td>850</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>37.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>70</th>\n",
" <td>7</td>\n",
" <td>586</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>71</th>\n",
" <td>7</td>\n",
" <td>845</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>25.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>72</th>\n",
" <td>7</td>\n",
" <td>1033</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>73</th>\n",
" <td>7</td>\n",
" <td>867</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>74</th>\n",
" <td>7</td>\n",
" <td>901</td>\n",
" <td>75.0</td>\n",
" <td>25.0</td>\n",
" <td>37.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75</th>\n",
" <td>7</td>\n",
" <td>955</td>\n",
" <td>87.5</td>\n",
" <td>12.5</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>76</th>\n",
" <td>7</td>\n",
" <td>780</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77</th>\n",
" <td>7</td>\n",
" <td>694</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>12.5</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>78</th>\n",
" <td>7</td>\n",
" <td>719</td>\n",
" <td>62.5</td>\n",
" <td>37.5</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"39 4 1303 62.5 37.5 \n",
"40 4 1384 62.5 37.5 \n",
"41 4 1191 87.5 12.5 \n",
"42 4 1335 50.0 50.0 \n",
"43 4 1253 75.0 25.0 \n",
"44 4 1239 100.0 0.0 \n",
"45 4 1109 87.5 12.5 \n",
"46 4 952 100.0 0.0 \n",
"47 4 928 100.0 0.0 \n",
"48 4 1428 87.5 12.5 \n",
"49 4 1115 62.5 37.5 \n",
"50 5 1157 100.0 0.0 \n",
"51 5 1097 75.0 25.0 \n",
"52 5 1160 100.0 0.0 \n",
"53 5 1053 87.5 12.5 \n",
"54 5 953 87.5 12.5 \n",
"55 5 1303 75.0 25.0 \n",
"56 5 1257 37.5 62.5 \n",
"57 5 1008 100.0 0.0 \n",
"58 5 1188 12.5 87.5 \n",
"59 6 670 87.5 12.5 \n",
"60 6 614 87.5 12.5 \n",
"61 6 778 100.0 0.0 \n",
"62 6 778 100.0 0.0 \n",
"63 6 832 62.5 37.5 \n",
"64 6 1173 87.5 12.5 \n",
"65 6 1007 87.5 12.5 \n",
"66 6 1025 87.5 12.5 \n",
"67 6 1012 87.5 12.5 \n",
"68 6 845 87.5 12.5 \n",
"69 7 850 100.0 0.0 \n",
"70 7 586 75.0 25.0 \n",
"71 7 845 87.5 12.5 \n",
"72 7 1033 100.0 0.0 \n",
"73 7 867 87.5 12.5 \n",
"74 7 901 75.0 25.0 \n",
"75 7 955 87.5 12.5 \n",
"76 7 780 100.0 0.0 \n",
"77 7 694 100.0 0.0 \n",
"78 7 719 62.5 37.5 \n",
"\n",
" cer clusters \n",
"39 37.5 1 \n",
"40 25.0 1 \n",
"41 50.0 1 \n",
"42 25.0 1 \n",
"43 25.0 1 \n",
"44 25.0 3 \n",
"45 50.0 1 \n",
"46 25.0 3 \n",
"47 0.0 3 \n",
"48 37.5 1 \n",
"49 75.0 1 \n",
"50 25.0 3 \n",
"51 37.5 1 \n",
"52 0.0 3 \n",
"53 12.5 3 \n",
"54 0.0 3 \n",
"55 37.5 1 \n",
"56 75.0 2 \n",
"57 0.0 3 \n",
"58 87.5 2 \n",
"59 12.5 0 \n",
"60 50.0 0 \n",
"61 25.0 0 \n",
"62 12.5 0 \n",
"63 50.0 0 \n",
"64 12.5 0 \n",
"65 12.5 0 \n",
"66 12.5 0 \n",
"67 37.5 0 \n",
"68 62.5 0 \n",
"69 37.5 0 \n",
"70 0.0 0 \n",
"71 25.0 0 \n",
"72 0.0 0 \n",
"73 12.5 0 \n",
"74 37.5 0 \n",
"75 12.5 0 \n",
"76 12.5 0 \n",
"77 12.5 0 \n",
"78 0.0 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Keep the clustering-relevant columns, selected by name so the cell does not\n",
"# depend on the column order of the CSV, and attach each row's cluster label.\n",
"feature_columns = [\n",
"    'child_age',\n",
"    'mean_reaction_time',\n",
"    'percentage_no_of_correct_responses',\n",
"    'oer',\n",
"    'cer',\n",
"]\n",
"new_df = dataset[feature_columns].copy()  # copy so adding a column never touches dataset\n",
"new_df['clusters'] = yhat  # NOTE(review): assumes yhat has one label per row of dataset, in row order\n",
"display(new_df)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "dd477754",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Silhouette Coefficient: 0.319\n",
"Calinski-Harabasz Index: 25.712\n",
"Davies-Bouldin Index: 0.865\n"
]
}
],
"source": [
"from sklearn.metrics import silhouette_score, calinski_harabasz_score, davies_bouldin_score\n",
"\n",
"# Score the labels in yhat against x with three internal cluster-validation metrics,\n",
"# each reported to three decimal places.\n",
"print(f\"Silhouette Coefficient: {silhouette_score(x, yhat):.3f}\")\n",
"print(f\"Calinski-Harabasz Index: {calinski_harabasz_score(x, yhat):.3f}\")\n",
"print(f\"Davies-Bouldin Index: {davies_bouldin_score(x, yhat):.3f}\")"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1 (label 0)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "ba8fef3b",
"metadata": {},
"outputs": [],
"source": [
"# Number of rows whose cluster label is 0\n",
"len(new_df.loc[new_df[\"clusters\"].eq(0)])"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "6c5b7397",
"metadata": {},
"outputs": [],
"source": [
"# Rows whose cluster label is 0\n",
"cluster_0 = new_df.loc[new_df[\"clusters\"].eq(0)]\n",
"display(cluster_0)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "849d9447",
"metadata": {},
"outputs": [],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0]\n",
"\n",
"# Print the smallest and largest value of each metric among the rows labelled 0.\n",
"# A single loop keeps the four metrics formatted identically.\n",
"range_columns = [\"mean_reaction_time\", \"percentage_no_of_correct_responses\", \"oer\", \"cer\"]\n",
"for col_pos, col_name in enumerate(range_columns):\n",
"    if col_pos:\n",
"        print()  # blank separator between metrics, none after the last one\n",
"    minVal = cluster_0[col_name].min()\n",
"    maxVal = cluster_0[col_name].max()\n",
"    print(col_name + \" min - \", minVal)\n",
"    print(col_name + \" max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2 (label 1)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "f9ed816e",
"metadata": {},
"outputs": [],
"source": [
"# Number of rows whose cluster label is 1\n",
"len(new_df.loc[new_df[\"clusters\"].eq(1)])"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "e3eeb500",
"metadata": {},
"outputs": [],
"source": [
"# Rows whose cluster label is 1\n",
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"display(cluster_1)\n",
"# Optional box plots of the error rates (disabled). The columns of new_df are\n",
"# lower-case 'cer' / 'oer'; upper-case names would raise a KeyError.\n",
"#cluster_1.boxplot(column =['cer'], grid = False)\n",
"#cluster_1.boxplot(column =['oer'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "2ab1bc45",
"metadata": {},
"outputs": [],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1]\n",
"\n",
"# Print the smallest and largest value of each metric among the rows labelled 1.\n",
"# A single loop keeps the four metrics formatted identically.\n",
"range_columns = [\"mean_reaction_time\", \"percentage_no_of_correct_responses\", \"oer\", \"cer\"]\n",
"for col_pos, col_name in enumerate(range_columns):\n",
"    if col_pos:\n",
"        print()  # blank separator between metrics, none after the last one\n",
"    minVal = cluster_1[col_name].min()\n",
"    maxVal = cluster_1[col_name].max()\n",
"    print(col_name + \" min - \", minVal)\n",
"    print(col_name + \" max - \", maxVal)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "61fc2f95",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
This source diff could not be displayed because it is too large. You can view the blob instead.
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>80</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1448</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>81</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1331</td>\n",
" <td>78000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>82</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1426</td>\n",
" <td>74500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>83</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1632</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>83</th>\n",
" <td>84</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1340</td>\n",
" <td>72000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>85</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1564</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>86</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1366</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>86</th>\n",
" <td>87</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1291</td>\n",
" <td>74500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>87</th>\n",
" <td>88</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2032</td>\n",
" <td>71500</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>89</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1789</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>90</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1680</td>\n",
" <td>73500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>90</th>\n",
" <td>91</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1317</td>\n",
" <td>67500</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>91</th>\n",
" <td>92</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1040</td>\n",
" <td>70500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>92</th>\n",
" <td>93</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1142</td>\n",
" <td>75500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>93</th>\n",
" <td>94</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1168</td>\n",
" <td>75000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>94</th>\n",
" <td>95</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1150</td>\n",
" <td>77000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>95</th>\n",
" <td>96</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1270</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>97</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1457</td>\n",
" <td>73000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>97</th>\n",
" <td>98</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1180</td>\n",
" <td>72500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>98</th>\n",
" <td>99</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1261</td>\n",
" <td>73500</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>99</th>\n",
" <td>100</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>1234</td>\n",
" <td>71500</td>\n",
" <td>No</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>100</th>\n",
" <td>101</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1165</td>\n",
" <td>73000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>101</th>\n",
" <td>102</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1238</td>\n",
" <td>71000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>102</th>\n",
" <td>103</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1830</td>\n",
" <td>71000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>104</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1657</td>\n",
" <td>78000</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>105</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>1817</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>106</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1600</td>\n",
" <td>84500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>107</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1396</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>108</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1380</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>109</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1350</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>110</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1310</td>\n",
" <td>87000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>111</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1462</td>\n",
" <td>94000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>112</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1069</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>113</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1221</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>114</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1775</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>115</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1852</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>116</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1598</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>117</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1785</td>\n",
" <td>86000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>118</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1628</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>119</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1758</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>120</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1215</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>121</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1134</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>122</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1364</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>123</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1499</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>124</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1998</td>\n",
" <td>88000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>125</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1916</td>\n",
" <td>85500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>126</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1152</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>127</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1086</td>\n",
" <td>92500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>128</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1207</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>129</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1047</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>130</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1162</td>\n",
" <td>88500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>131</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1278</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"79 80 1 4 10 10 \n",
"80 81 1 4 10 10 \n",
"81 82 1 4 10 10 \n",
"82 83 2 4 10 10 \n",
"83 84 2 4 10 9 \n",
"84 85 2 4 10 10 \n",
"85 86 2 4 10 8 \n",
"86 87 2 4 10 10 \n",
"87 88 2 4 10 8 \n",
"88 89 2 4 10 9 \n",
"89 90 2 4 10 10 \n",
"90 91 1 4 10 9 \n",
"91 92 1 4 10 10 \n",
"92 93 1 4 10 10 \n",
"93 94 1 4 10 10 \n",
"94 95 1 4 10 10 \n",
"95 96 1 4 10 10 \n",
"96 97 1 4 10 9 \n",
"97 98 1 4 10 10 \n",
"98 99 1 4 10 9 \n",
"99 100 1 4 10 7 \n",
"100 101 1 4 10 10 \n",
"101 102 1 4 10 10 \n",
"102 103 1 4 10 9 \n",
"103 104 1 4 10 8 \n",
"104 105 1 4 10 7 \n",
"105 106 2 5 12 11 \n",
"106 107 2 5 12 11 \n",
"107 108 2 5 12 12 \n",
"108 109 2 5 12 12 \n",
"109 110 2 5 12 12 \n",
"110 111 2 5 12 12 \n",
"111 112 1 5 12 12 \n",
"112 113 1 5 12 12 \n",
"113 114 1 5 12 10 \n",
"114 115 2 5 12 10 \n",
"115 116 2 5 12 11 \n",
"116 117 2 5 12 12 \n",
"117 118 2 5 12 12 \n",
"118 119 2 5 12 12 \n",
"119 120 2 5 12 12 \n",
"120 121 2 5 12 12 \n",
"121 122 2 5 12 11 \n",
"122 123 2 5 12 12 \n",
"123 124 2 5 12 12 \n",
"124 125 2 5 12 10 \n",
"125 126 2 5 12 12 \n",
"126 127 2 5 12 12 \n",
"127 128 2 5 12 12 \n",
"128 129 2 5 12 12 \n",
"129 130 2 5 12 10 \n",
"130 131 2 5 12 12 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"79 0 0 1448 74000 \n",
"80 0 0 1331 78000 \n",
"81 0 0 1426 74500 \n",
"82 0 0 1632 76000 \n",
"83 0 1 1340 72000 \n",
"84 0 0 1564 76000 \n",
"85 0 2 1366 76000 \n",
"86 0 0 1291 74500 \n",
"87 0 2 2032 71500 \n",
"88 0 1 1789 74000 \n",
"89 0 0 1680 73500 \n",
"90 0 1 1317 67500 \n",
"91 0 0 1040 70500 \n",
"92 0 0 1142 75500 \n",
"93 0 0 1168 75000 \n",
"94 0 0 1150 77000 \n",
"95 0 0 1270 76000 \n",
"96 0 1 1457 73000 \n",
"97 0 0 1180 72500 \n",
"98 0 1 1261 73500 \n",
"99 0 3 1234 71500 \n",
"100 0 0 1165 73000 \n",
"101 0 0 1238 71000 \n",
"102 0 1 1830 71000 \n",
"103 0 2 1657 78000 \n",
"104 0 3 1817 74000 \n",
"105 0 1 1600 84500 \n",
"106 0 1 1396 86500 \n",
"107 0 0 1380 89000 \n",
"108 0 0 1350 90000 \n",
"109 0 0 1310 87000 \n",
"110 0 0 1462 94000 \n",
"111 0 0 1069 89000 \n",
"112 0 0 1221 92000 \n",
"113 0 2 1775 90000 \n",
"114 0 2 1852 89500 \n",
"115 0 1 1598 92000 \n",
"116 0 0 1785 86000 \n",
"117 0 0 1628 92000 \n",
"118 0 0 1758 86500 \n",
"119 0 0 1215 92000 \n",
"120 0 0 1134 89000 \n",
"121 0 1 1364 89000 \n",
"122 0 0 1499 89000 \n",
"123 0 0 1998 88000 \n",
"124 0 2 1916 85500 \n",
"125 0 0 1152 89500 \n",
"126 0 0 1086 92500 \n",
"127 0 0 1207 86500 \n",
"128 0 0 1047 92000 \n",
"129 0 2 1162 88500 \n",
"130 0 0 1278 89000 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer game \n",
"79 No 100.000000 0.000000 0.0 Focused \n",
"80 No 100.000000 0.000000 0.0 Focused \n",
"81 No 100.000000 0.000000 0.0 Focused \n",
"82 No 100.000000 0.000000 0.0 Focused \n",
"83 No 90.000000 10.000000 0.0 Focused \n",
"84 No 100.000000 0.000000 0.0 Focused \n",
"85 No 80.000000 20.000000 0.0 Focused \n",
"86 No 100.000000 0.000000 0.0 Focused \n",
"87 No 80.000000 20.000000 0.0 Focused \n",
"88 No 90.000000 10.000000 0.0 Focused \n",
"89 No 100.000000 0.000000 0.0 Focused \n",
"90 No 90.000000 10.000000 0.0 Focused \n",
"91 No 100.000000 0.000000 0.0 Focused \n",
"92 No 100.000000 0.000000 0.0 Focused \n",
"93 No 100.000000 0.000000 0.0 Focused \n",
"94 No 100.000000 0.000000 0.0 Focused \n",
"95 No 100.000000 0.000000 0.0 Focused \n",
"96 No 90.000000 10.000000 0.0 Focused \n",
"97 No 100.000000 0.000000 0.0 Focused \n",
"98 No 90.000000 10.000000 0.0 Focused \n",
"99 No 70.000000 30.000000 0.0 Focused \n",
"100 No 100.000000 0.000000 0.0 Focused \n",
"101 No 100.000000 0.000000 0.0 Focused \n",
"102 No 90.000000 10.000000 0.0 Focused \n",
"103 No 80.000000 20.000000 0.0 Focused \n",
"104 No 70.000000 30.000000 0.0 Focused \n",
"105 No 91.666667 8.333333 0.0 Focused \n",
"106 No 91.666667 8.333333 0.0 Focused \n",
"107 No 100.000000 0.000000 0.0 Focused \n",
"108 No 100.000000 0.000000 0.0 Focused \n",
"109 No 100.000000 0.000000 0.0 Focused \n",
"110 No 100.000000 0.000000 0.0 Focused \n",
"111 No 100.000000 0.000000 0.0 Focused \n",
"112 No 100.000000 0.000000 0.0 Focused \n",
"113 No 83.333333 16.666667 0.0 Focused \n",
"114 No 83.333333 16.666667 0.0 Focused \n",
"115 No 91.666667 8.333333 0.0 Focused \n",
"116 No 100.000000 0.000000 0.0 Focused \n",
"117 No 100.000000 0.000000 0.0 Focused \n",
"118 No 100.000000 0.000000 0.0 Focused \n",
"119 No 100.000000 0.000000 0.0 Focused \n",
"120 No 100.000000 0.000000 0.0 Focused \n",
"121 No 91.666667 8.333333 0.0 Focused \n",
"122 No 100.000000 0.000000 0.0 Focused \n",
"123 No 100.000000 0.000000 0.0 Focused \n",
"124 No 83.333333 16.666667 0.0 Focused \n",
"125 No 100.000000 0.000000 0.0 Focused \n",
"126 No 100.000000 0.000000 0.0 Focused \n",
"127 No 100.000000 0.000000 0.0 Focused \n",
"128 No 100.000000 0.000000 0.0 Focused \n",
"129 No 83.333333 16.666667 0.0 Focused \n",
"130 No 100.000000 0.000000 0.0 Focused "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Importing the dataset \n",
"dataset = pd.read_csv('data.csv') \n",
"dataset.drop(dataset.index[dataset['game'] == 'Alternating'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Sustained'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Selective'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Divided'], inplace = True)\n",
"\n",
"dataset.drop(dataset.index[dataset['child_age'] == 6], inplace = True)\n",
"dataset.drop(dataset.index[dataset['child_age'] == 7], inplace = True)\n",
"\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[1448. , 100. , 0. ],\n",
" [1331. , 100. , 0. ],\n",
" [1426. , 100. , 0. ],\n",
" [1632. , 100. , 0. ],\n",
" [1340. , 90. , 10. ],\n",
" [1564. , 100. , 0. ],\n",
" [1366. , 80. , 20. ],\n",
" [1291. , 100. , 0. ],\n",
" [2032. , 80. , 20. ],\n",
" [1789. , 90. , 10. ],\n",
" [1680. , 100. , 0. ],\n",
" [1317. , 90. , 10. ],\n",
" [1040. , 100. , 0. ],\n",
" [1142. , 100. , 0. ],\n",
" [1168. , 100. , 0. ],\n",
" [1150. , 100. , 0. ],\n",
" [1270. , 100. , 0. ],\n",
" [1457. , 90. , 10. ],\n",
" [1180. , 100. , 0. ],\n",
" [1261. , 90. , 10. ],\n",
" [1234. , 70. , 30. ],\n",
" [1165. , 100. , 0. ],\n",
" [1238. , 100. , 0. ],\n",
" [1830. , 90. , 10. ],\n",
" [1657. , 80. , 20. ],\n",
" [1817. , 70. , 30. ],\n",
" [1600. , 91.66666667, 8.33333333],\n",
" [1396. , 91.66666667, 8.33333333],\n",
" [1380. , 100. , 0. ],\n",
" [1350. , 100. , 0. ],\n",
" [1310. , 100. , 0. ],\n",
" [1462. , 100. , 0. ],\n",
" [1069. , 100. , 0. ],\n",
" [1221. , 100. , 0. ],\n",
" [1775. , 83.33333333, 16.66666667],\n",
" [1852. , 83.33333333, 16.66666667],\n",
" [1598. , 91.66666667, 8.33333333],\n",
" [1785. , 100. , 0. ],\n",
" [1628. , 100. , 0. ],\n",
" [1758. , 100. , 0. ],\n",
" [1215. , 100. , 0. ],\n",
" [1134. , 100. , 0. ],\n",
" [1364. , 91.66666667, 8.33333333],\n",
" [1499. , 100. , 0. ],\n",
" [1998. , 100. , 0. ],\n",
" [1916. , 83.33333333, 16.66666667],\n",
" [1152. , 100. , 0. ],\n",
" [1086. , 100. , 0. ],\n",
" [1207. , 100. , 0. ],\n",
" [1047. , 100. , 0. ],\n",
" [1162. , 83.33333333, 16.66666667],\n",
" [1278. , 100. , 0. ]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# extracting only 11-comission & 12-omission\n",
"x = dataset.iloc[:, [7, 10, 11]].values \n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 0.08876077, 0.65810029, -0.65810029],\n",
" [-0.35063754, 0.65810029, -0.65810029],\n",
" [ 0.00613887, 0.65810029, -0.65810029],\n",
" [ 0.77978033, 0.65810029, -0.65810029],\n",
" [-0.31683767, -0.56408597, 0.56408597],\n",
" [ 0.52440354, 0.65810029, -0.65810029],\n",
" [-0.2191936 , -1.78627223, 1.78627223],\n",
" [-0.50085918, 0.65810029, -0.65810029],\n",
" [ 2.28199678, -1.78627223, 1.78627223],\n",
" [ 1.36940029, -0.56408597, 0.56408597],\n",
" [ 0.96004631, 0.65810029, -0.65810029],\n",
" [-0.40321512, -0.56408597, 0.56408597],\n",
" [-1.4435 , 0.65810029, -0.65810029],\n",
" [-1.06043481, 0.65810029, -0.65810029],\n",
" [-0.96279074, 0.65810029, -0.65810029],\n",
" [-1.03039048, 0.65810029, -0.65810029],\n",
" [-0.57972555, 0.65810029, -0.65810029],\n",
" [ 0.12256064, -0.56408597, 0.56408597],\n",
" [-0.91772425, 0.65810029, -0.65810029],\n",
" [-0.61352542, -0.56408597, 0.56408597],\n",
" [-0.71492503, -3.00845849, 3.00845849],\n",
" [-0.97405736, 0.65810029, -0.65810029],\n",
" [-0.69990286, 0.65810029, -0.65810029],\n",
" [ 1.52337747, -0.56408597, 0.56408597],\n",
" [ 0.87366886, -1.78627223, 1.78627223],\n",
" [ 1.47455544, -3.00845849, 3.00845849],\n",
" [ 0.65960302, -0.36038826, 0.36038826],\n",
" [-0.10652737, -0.36038826, 0.36038826],\n",
" [-0.16661603, 0.65810029, -0.65810029],\n",
" [-0.27928226, 0.65810029, -0.65810029],\n",
" [-0.4295039 , 0.65810029, -0.65810029],\n",
" [ 0.14133835, 0.65810029, -0.65810029],\n",
" [-1.33458931, 0.65810029, -0.65810029],\n",
" [-0.76374706, 0.65810029, -0.65810029],\n",
" [ 1.31682271, -1.37887681, 1.37887681],\n",
" [ 1.60599938, -1.37887681, 1.37887681],\n",
" [ 0.65209194, -0.36038826, 0.36038826],\n",
" [ 1.35437812, 0.65810029, -0.65810029],\n",
" [ 0.76475817, 0.65810029, -0.65810029],\n",
" [ 1.25297851, 0.65810029, -0.65810029],\n",
" [-0.78628031, 0.65810029, -0.65810029],\n",
" [-1.09047914, 0.65810029, -0.65810029],\n",
" [-0.22670468, -0.36038826, 0.36038826],\n",
" [ 0.28029337, 0.65810029, -0.65810029],\n",
" [ 2.15430838, 0.65810029, -0.65810029],\n",
" [ 1.84635401, -1.37887681, 1.37887681],\n",
" [-1.0228794 , 0.65810029, -0.65810029],\n",
" [-1.27074511, 0.65810029, -0.65810029],\n",
" [-0.81632464, 0.65810029, -0.65810029],\n",
" [-1.41721122, 0.65810029, -0.65810029],\n",
" [-0.98532399, -1.37887681, 1.37887681],\n",
" [-0.54968122, 0.65810029, -0.65810029]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# standardizing the data\n",
"from sklearn.preprocessing import StandardScaler\n",
"scaler = StandardScaler()\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# statistics of scaled data\n",
"pd.DataFrame(new_df).describe()\n",
"\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "b5fc4f60",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 4. , 0.08876077, 0.65810029, -0.65810029],\n",
" [ 4. , -0.35063754, 0.65810029, -0.65810029],\n",
" [ 4. , 0.00613887, 0.65810029, -0.65810029],\n",
" [ 4. , 0.77978033, 0.65810029, -0.65810029],\n",
" [ 4. , -0.31683767, -0.56408597, 0.56408597],\n",
" [ 4. , 0.52440354, 0.65810029, -0.65810029],\n",
" [ 4. , -0.2191936 , -1.78627223, 1.78627223],\n",
" [ 4. , -0.50085918, 0.65810029, -0.65810029],\n",
" [ 4. , 2.28199678, -1.78627223, 1.78627223],\n",
" [ 4. , 1.36940029, -0.56408597, 0.56408597],\n",
" [ 4. , 0.96004631, 0.65810029, -0.65810029],\n",
" [ 4. , -0.40321512, -0.56408597, 0.56408597],\n",
" [ 4. , -1.4435 , 0.65810029, -0.65810029],\n",
" [ 4. , -1.06043481, 0.65810029, -0.65810029],\n",
" [ 4. , -0.96279074, 0.65810029, -0.65810029],\n",
" [ 4. , -1.03039048, 0.65810029, -0.65810029],\n",
" [ 4. , -0.57972555, 0.65810029, -0.65810029],\n",
" [ 4. , 0.12256064, -0.56408597, 0.56408597],\n",
" [ 4. , -0.91772425, 0.65810029, -0.65810029],\n",
" [ 4. , -0.61352542, -0.56408597, 0.56408597],\n",
" [ 4. , -0.71492503, -3.00845849, 3.00845849],\n",
" [ 4. , -0.97405736, 0.65810029, -0.65810029],\n",
" [ 4. , -0.69990286, 0.65810029, -0.65810029],\n",
" [ 4. , 1.52337747, -0.56408597, 0.56408597],\n",
" [ 4. , 0.87366886, -1.78627223, 1.78627223],\n",
" [ 4. , 1.47455544, -3.00845849, 3.00845849],\n",
" [ 5. , 0.65960302, -0.36038826, 0.36038826],\n",
" [ 5. , -0.10652737, -0.36038826, 0.36038826],\n",
" [ 5. , -0.16661603, 0.65810029, -0.65810029],\n",
" [ 5. , -0.27928226, 0.65810029, -0.65810029],\n",
" [ 5. , -0.4295039 , 0.65810029, -0.65810029],\n",
" [ 5. , 0.14133835, 0.65810029, -0.65810029],\n",
" [ 5. , -1.33458931, 0.65810029, -0.65810029],\n",
" [ 5. , -0.76374706, 0.65810029, -0.65810029],\n",
" [ 5. , 1.31682271, -1.37887681, 1.37887681],\n",
" [ 5. , 1.60599938, -1.37887681, 1.37887681],\n",
" [ 5. , 0.65209194, -0.36038826, 0.36038826],\n",
" [ 5. , 1.35437812, 0.65810029, -0.65810029],\n",
" [ 5. , 0.76475817, 0.65810029, -0.65810029],\n",
" [ 5. , 1.25297851, 0.65810029, -0.65810029],\n",
" [ 5. , -0.78628031, 0.65810029, -0.65810029],\n",
" [ 5. , -1.09047914, 0.65810029, -0.65810029],\n",
" [ 5. , -0.22670468, -0.36038826, 0.36038826],\n",
" [ 5. , 0.28029337, 0.65810029, -0.65810029],\n",
" [ 5. , 2.15430838, 0.65810029, -0.65810029],\n",
" [ 5. , 1.84635401, -1.37887681, 1.37887681],\n",
" [ 5. , -1.0228794 , 0.65810029, -0.65810029],\n",
" [ 5. , -1.27074511, 0.65810029, -0.65810029],\n",
" [ 5. , -0.81632464, 0.65810029, -0.65810029],\n",
" [ 5. , -1.41721122, 0.65810029, -0.65810029],\n",
" [ 5. , -0.98532399, -1.37887681, 1.37887681],\n",
" [ 5. , -0.54968122, 0.65810029, -0.65810029]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"x = dataset.iloc[:, [2, 7, 10, 11]].copy()\n",
"x[['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']] = new_df\n",
"x.head()\n",
"x = x.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "5d1c61bf",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[0 1 2 3]\n"
]
}
],
"source": [
"from sklearn.cluster import Birch\n",
"\n",
"# define the model\n",
"model = Birch(threshold=0.01, n_clusters=4)\n",
"# fit the model\n",
"model.fit(x)\n",
"# assign a cluster to each example\n",
"yhat = model.predict(x)\n",
"# retrieve unique clusters\n",
"clusters = unique(yhat)\n",
"print(clusters)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>4</td>\n",
" <td>1448</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>4</td>\n",
" <td>1331</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>4</td>\n",
" <td>1426</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>4</td>\n",
" <td>1632</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>83</th>\n",
" <td>4</td>\n",
" <td>1340</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>4</td>\n",
" <td>1564</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>4</td>\n",
" <td>1366</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>86</th>\n",
" <td>4</td>\n",
" <td>1291</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>87</th>\n",
" <td>4</td>\n",
" <td>2032</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>4</td>\n",
" <td>1789</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>4</td>\n",
" <td>1680</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>90</th>\n",
" <td>4</td>\n",
" <td>1317</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>91</th>\n",
" <td>4</td>\n",
" <td>1040</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>92</th>\n",
" <td>4</td>\n",
" <td>1142</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>93</th>\n",
" <td>4</td>\n",
" <td>1168</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>94</th>\n",
" <td>4</td>\n",
" <td>1150</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>95</th>\n",
" <td>4</td>\n",
" <td>1270</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>4</td>\n",
" <td>1457</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>97</th>\n",
" <td>4</td>\n",
" <td>1180</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>98</th>\n",
" <td>4</td>\n",
" <td>1261</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>99</th>\n",
" <td>4</td>\n",
" <td>1234</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>100</th>\n",
" <td>4</td>\n",
" <td>1165</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>101</th>\n",
" <td>4</td>\n",
" <td>1238</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>102</th>\n",
" <td>4</td>\n",
" <td>1830</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>4</td>\n",
" <td>1657</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>4</td>\n",
" <td>1817</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>5</td>\n",
" <td>1600</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>5</td>\n",
" <td>1396</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>5</td>\n",
" <td>1380</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>5</td>\n",
" <td>1350</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>5</td>\n",
" <td>1310</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>5</td>\n",
" <td>1462</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>5</td>\n",
" <td>1069</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>5</td>\n",
" <td>1221</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>5</td>\n",
" <td>1775</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>5</td>\n",
" <td>1852</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>5</td>\n",
" <td>1598</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>5</td>\n",
" <td>1785</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>5</td>\n",
" <td>1628</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>5</td>\n",
" <td>1758</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>5</td>\n",
" <td>1215</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>5</td>\n",
" <td>1134</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>5</td>\n",
" <td>1364</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>5</td>\n",
" <td>1499</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>5</td>\n",
" <td>1998</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>5</td>\n",
" <td>1916</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>5</td>\n",
" <td>1152</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>5</td>\n",
" <td>1086</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>5</td>\n",
" <td>1207</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>5</td>\n",
" <td>1047</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>5</td>\n",
" <td>1162</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>5</td>\n",
" <td>1278</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"79 4 1448 100.000000 \n",
"80 4 1331 100.000000 \n",
"81 4 1426 100.000000 \n",
"82 4 1632 100.000000 \n",
"83 4 1340 90.000000 \n",
"84 4 1564 100.000000 \n",
"85 4 1366 80.000000 \n",
"86 4 1291 100.000000 \n",
"87 4 2032 80.000000 \n",
"88 4 1789 90.000000 \n",
"89 4 1680 100.000000 \n",
"90 4 1317 90.000000 \n",
"91 4 1040 100.000000 \n",
"92 4 1142 100.000000 \n",
"93 4 1168 100.000000 \n",
"94 4 1150 100.000000 \n",
"95 4 1270 100.000000 \n",
"96 4 1457 90.000000 \n",
"97 4 1180 100.000000 \n",
"98 4 1261 90.000000 \n",
"99 4 1234 70.000000 \n",
"100 4 1165 100.000000 \n",
"101 4 1238 100.000000 \n",
"102 4 1830 90.000000 \n",
"103 4 1657 80.000000 \n",
"104 4 1817 70.000000 \n",
"105 5 1600 91.666667 \n",
"106 5 1396 91.666667 \n",
"107 5 1380 100.000000 \n",
"108 5 1350 100.000000 \n",
"109 5 1310 100.000000 \n",
"110 5 1462 100.000000 \n",
"111 5 1069 100.000000 \n",
"112 5 1221 100.000000 \n",
"113 5 1775 83.333333 \n",
"114 5 1852 83.333333 \n",
"115 5 1598 91.666667 \n",
"116 5 1785 100.000000 \n",
"117 5 1628 100.000000 \n",
"118 5 1758 100.000000 \n",
"119 5 1215 100.000000 \n",
"120 5 1134 100.000000 \n",
"121 5 1364 91.666667 \n",
"122 5 1499 100.000000 \n",
"123 5 1998 100.000000 \n",
"124 5 1916 83.333333 \n",
"125 5 1152 100.000000 \n",
"126 5 1086 100.000000 \n",
"127 5 1207 100.000000 \n",
"128 5 1047 100.000000 \n",
"129 5 1162 83.333333 \n",
"130 5 1278 100.000000 \n",
"\n",
" oer clusters \n",
"79 0.000000 2 \n",
"80 0.000000 2 \n",
"81 0.000000 2 \n",
"82 0.000000 1 \n",
"83 10.000000 3 \n",
"84 0.000000 1 \n",
"85 20.000000 0 \n",
"86 0.000000 2 \n",
"87 20.000000 0 \n",
"88 10.000000 0 \n",
"89 0.000000 1 \n",
"90 10.000000 3 \n",
"91 0.000000 2 \n",
"92 0.000000 2 \n",
"93 0.000000 2 \n",
"94 0.000000 2 \n",
"95 0.000000 2 \n",
"96 10.000000 3 \n",
"97 0.000000 2 \n",
"98 10.000000 3 \n",
"99 30.000000 0 \n",
"100 0.000000 2 \n",
"101 0.000000 2 \n",
"102 10.000000 0 \n",
"103 20.000000 0 \n",
"104 30.000000 0 \n",
"105 8.333333 3 \n",
"106 8.333333 3 \n",
"107 0.000000 2 \n",
"108 0.000000 2 \n",
"109 0.000000 2 \n",
"110 0.000000 2 \n",
"111 0.000000 2 \n",
"112 0.000000 2 \n",
"113 16.666667 0 \n",
"114 16.666667 0 \n",
"115 8.333333 3 \n",
"116 0.000000 1 \n",
"117 0.000000 1 \n",
"118 0.000000 1 \n",
"119 0.000000 2 \n",
"120 0.000000 2 \n",
"121 8.333333 3 \n",
"122 0.000000 2 \n",
"123 0.000000 1 \n",
"124 16.666667 0 \n",
"125 0.000000 2 \n",
"126 0.000000 2 \n",
"127 0.000000 2 \n",
"128 0.000000 2 \n",
"129 16.666667 0 \n",
"130 0.000000 2 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"new_df = dataset.iloc[:, [2, 7, 10, 11]].copy()\n",
"new_df['clusters'] = yhat\n",
"new_df.head()\n",
"display(new_df)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "50a9adbb",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Silhouette Coefficient: 0.401\n",
"Calinski-Harabasz Index: 41.707\n",
"Davies-Bouldin Index: 0.932\n"
]
}
],
"source": [
"from sklearn.metrics import silhouette_score,calinski_harabasz_score,davies_bouldin_score\n",
"\n",
"print(\"Silhouette Coefficient: %0.3f\" % silhouette_score(x, yhat))\n",
"print(\"Calinski-Harabasz Index: %0.3f\" % calinski_harabasz_score(x, yhat))\n",
"print(\"Davies-Bouldin Index: %0.3f\" % davies_bouldin_score(x, yhat))"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1 (cluster label 0)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "ba8fef3b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"11"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 0])"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "6c5b7397",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>4</td>\n",
" <td>1366</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>87</th>\n",
" <td>4</td>\n",
" <td>2032</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>4</td>\n",
" <td>1789</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>99</th>\n",
" <td>4</td>\n",
" <td>1234</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>102</th>\n",
" <td>4</td>\n",
" <td>1830</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>4</td>\n",
" <td>1657</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>4</td>\n",
" <td>1817</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>5</td>\n",
" <td>1775</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>5</td>\n",
" <td>1852</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>5</td>\n",
" <td>1916</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>5</td>\n",
" <td>1162</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"85 4 1366 80.000000 \n",
"87 4 2032 80.000000 \n",
"88 4 1789 90.000000 \n",
"99 4 1234 70.000000 \n",
"102 4 1830 90.000000 \n",
"103 4 1657 80.000000 \n",
"104 4 1817 70.000000 \n",
"113 5 1775 83.333333 \n",
"114 5 1852 83.333333 \n",
"124 5 1916 83.333333 \n",
"129 5 1162 83.333333 \n",
"\n",
" oer clusters \n",
"85 20.000000 0 \n",
"87 20.000000 0 \n",
"88 10.000000 0 \n",
"99 30.000000 0 \n",
"102 10.000000 0 \n",
"103 20.000000 0 \n",
"104 30.000000 0 \n",
"113 16.666667 0 \n",
"114 16.666667 0 \n",
"124 16.666667 0 \n",
"129 16.666667 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"display(cluster_0)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "849d9447",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 1162\n",
"mean_reaction_time max - 2032\n",
"\n",
"percentage_no_of_correct_responses min - 70.0\n",
"percentage_no_of_correct_responses max - 90.0\n",
"\n",
"oer min - 10.0\n",
"oer max - 30.0\n"
]
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"\n",
"maxVal = cluster_0['mean_reaction_time'].max()\n",
"minVal = cluster_0['mean_reaction_time'].min()\n",
"\n",
"print(\"mean_reaction_time min - \", minVal)\n",
"print(\"mean_reaction_time max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_0['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['oer'].max()\n",
"minVal = cluster_0['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2 (cluster label 1)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "f9ed816e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"7"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 1])"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "e3eeb500",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>4</td>\n",
" <td>1632</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>4</td>\n",
" <td>1564</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>4</td>\n",
" <td>1680</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>5</td>\n",
" <td>1785</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>5</td>\n",
" <td>1628</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>5</td>\n",
" <td>1758</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>5</td>\n",
" <td>1998</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"82 4 1632 100.0 0.0 \n",
"84 4 1564 100.0 0.0 \n",
"89 4 1680 100.0 0.0 \n",
"116 5 1785 100.0 0.0 \n",
"117 5 1628 100.0 0.0 \n",
"118 5 1758 100.0 0.0 \n",
"123 5 1998 100.0 0.0 \n",
"\n",
" clusters \n",
"82 1 \n",
"84 1 \n",
"89 1 \n",
"116 1 \n",
"117 1 \n",
"118 1 \n",
"123 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"display(cluster_1)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "bb910e6a",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 1564\n",
"mean_reaction_time max - 1998\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n"
]
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"\n",
"maxVal = cluster_1['mean_reaction_time'].max()\n",
"minVal = cluster_1['mean_reaction_time'].min()\n",
"\n",
"print(\"mean_reaction_time min - \", minVal)\n",
"print(\"mean_reaction_time max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_1['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['oer'].max()\n",
"minVal = cluster_1['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "e7f55f44",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"id": "3c84eacb",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
This source diff could not be displayed because it is too large. You can view the blob instead.
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>131</th>\n",
" <td>132</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1041</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>132</th>\n",
" <td>133</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1298</td>\n",
" <td>87000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>133</th>\n",
" <td>134</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1080</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>134</th>\n",
" <td>135</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1284</td>\n",
" <td>88000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>135</th>\n",
" <td>136</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1140</td>\n",
" <td>88000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>136</th>\n",
" <td>137</td>\n",
" <td>1</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1125</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>137</th>\n",
" <td>138</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>819</td>\n",
" <td>84000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>138</th>\n",
" <td>139</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>783</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>139</th>\n",
" <td>140</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>901</td>\n",
" <td>85000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>141</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>976</td>\n",
" <td>88500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>141</th>\n",
" <td>142</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>826</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>142</th>\n",
" <td>143</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>855</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>143</th>\n",
" <td>144</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>885</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>144</th>\n",
" <td>145</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1031</td>\n",
" <td>91000</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>146</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1082</td>\n",
" <td>86000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>147</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1061</td>\n",
" <td>83000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>148</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1374</td>\n",
" <td>85000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>149</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>940</td>\n",
" <td>86000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>150</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1071</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>150</th>\n",
" <td>151</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1102</td>\n",
" <td>85500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>151</th>\n",
" <td>152</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1146</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>153</td>\n",
" <td>2</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>792</td>\n",
" <td>87000</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>153</th>\n",
" <td>154</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1070</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>155</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1087</td>\n",
" <td>86000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>155</th>\n",
" <td>156</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1230</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>156</th>\n",
" <td>157</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1128</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>157</th>\n",
" <td>158</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>814</td>\n",
" <td>87000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>158</th>\n",
" <td>159</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1326</td>\n",
" <td>85000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>159</th>\n",
" <td>160</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1298</td>\n",
" <td>91000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"131 132 2 6 12 12 \n",
"132 133 2 6 12 12 \n",
"133 134 2 6 12 12 \n",
"134 135 1 6 12 12 \n",
"135 136 1 6 12 12 \n",
"136 137 1 6 12 12 \n",
"137 138 2 6 12 12 \n",
"138 139 2 6 12 12 \n",
"139 140 2 6 12 12 \n",
"140 141 2 6 12 12 \n",
"141 142 2 6 12 11 \n",
"142 143 2 6 12 12 \n",
"143 144 2 6 12 12 \n",
"144 145 2 6 12 11 \n",
"145 146 2 7 12 12 \n",
"146 147 2 7 12 12 \n",
"147 148 2 7 12 12 \n",
"148 149 2 7 12 12 \n",
"149 150 2 7 12 12 \n",
"150 151 2 7 12 11 \n",
"151 152 2 7 12 12 \n",
"152 153 2 7 12 10 \n",
"153 154 1 7 12 12 \n",
"154 155 1 7 12 12 \n",
"155 156 1 7 12 12 \n",
"156 157 1 7 12 12 \n",
"157 158 1 7 12 12 \n",
"158 159 1 7 12 12 \n",
"159 160 1 7 12 12 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"131 0 0 1041 89000 \n",
"132 0 0 1298 87000 \n",
"133 0 0 1080 86500 \n",
"134 0 0 1284 88000 \n",
"135 0 0 1140 88000 \n",
"136 0 0 1125 90000 \n",
"137 0 0 819 84000 \n",
"138 0 0 783 89500 \n",
"139 0 0 901 85000 \n",
"140 0 0 976 88500 \n",
"141 0 1 826 89500 \n",
"142 0 0 855 89500 \n",
"143 0 0 885 86500 \n",
"144 0 1 1031 91000 \n",
"145 0 0 1082 86000 \n",
"146 0 0 1061 83000 \n",
"147 0 0 1374 85000 \n",
"148 0 0 940 86000 \n",
"149 0 0 1071 86500 \n",
"150 0 1 1102 85500 \n",
"151 0 0 1146 86500 \n",
"152 0 2 792 87000 \n",
"153 0 0 1070 89500 \n",
"154 0 0 1087 86000 \n",
"155 0 0 1230 89500 \n",
"156 0 0 1128 90000 \n",
"157 0 0 814 87000 \n",
"158 0 0 1326 85000 \n",
"159 0 0 1298 91000 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer game \n",
"131 No 100.000000 0.000000 0.0 Focused \n",
"132 No 100.000000 0.000000 0.0 Focused \n",
"133 No 100.000000 0.000000 0.0 Focused \n",
"134 No 100.000000 0.000000 0.0 Focused \n",
"135 No 100.000000 0.000000 0.0 Focused \n",
"136 No 100.000000 0.000000 0.0 Focused \n",
"137 No 100.000000 0.000000 0.0 Focused \n",
"138 No 100.000000 0.000000 0.0 Focused \n",
"139 No 100.000000 0.000000 0.0 Focused \n",
"140 No 100.000000 0.000000 0.0 Focused \n",
"141 No 91.666667 8.333333 0.0 Focused \n",
"142 No 100.000000 0.000000 0.0 Focused \n",
"143 No 100.000000 0.000000 0.0 Focused \n",
"144 No 91.666667 8.333333 0.0 Focused \n",
"145 No 100.000000 0.000000 0.0 Focused \n",
"146 No 100.000000 0.000000 0.0 Focused \n",
"147 No 100.000000 0.000000 0.0 Focused \n",
"148 No 100.000000 0.000000 0.0 Focused \n",
"149 No 100.000000 0.000000 0.0 Focused \n",
"150 No 91.666667 8.333333 0.0 Focused \n",
"151 No 100.000000 0.000000 0.0 Focused \n",
"152 No 83.333333 16.666667 0.0 Focused \n",
"153 No 100.000000 0.000000 0.0 Focused \n",
"154 No 100.000000 0.000000 0.0 Focused \n",
"155 No 100.000000 0.000000 0.0 Focused \n",
"156 No 100.000000 0.000000 0.0 Focused \n",
"157 No 100.000000 0.000000 0.0 Focused \n",
"158 No 100.000000 0.000000 0.0 Focused \n",
"159 No 100.000000 0.000000 0.0 Focused "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Load the recorded results and keep only the rows that are neither in one of\n",
"# the excluded games nor in one of the excluded age groups listed below.\n",
"dataset = pd.read_csv('data.csv')\n",
"excluded_games = ['Alternating', 'Sustained', 'Selective', 'Divided']\n",
"excluded_ages = [4, 5]\n",
"is_excluded = dataset['game'].isin(excluded_games) | dataset['child_age'].isin(excluded_ages)\n",
"dataset = dataset.loc[~is_excluded].copy()\n",
"\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[1041. , 100. , 0. ],\n",
" [1298. , 100. , 0. ],\n",
" [1080. , 100. , 0. ],\n",
" [1284. , 100. , 0. ],\n",
" [1140. , 100. , 0. ],\n",
" [1125. , 100. , 0. ],\n",
" [ 819. , 100. , 0. ],\n",
" [ 783. , 100. , 0. ],\n",
" [ 901. , 100. , 0. ],\n",
" [ 976. , 100. , 0. ],\n",
" [ 826. , 91.66666667, 8.33333333],\n",
" [ 855. , 100. , 0. ],\n",
" [ 885. , 100. , 0. ],\n",
" [1031. , 91.66666667, 8.33333333],\n",
" [1082. , 100. , 0. ],\n",
" [1061. , 100. , 0. ],\n",
" [1374. , 100. , 0. ],\n",
" [ 940. , 100. , 0. ],\n",
" [1071. , 100. , 0. ],\n",
" [1102. , 91.66666667, 8.33333333],\n",
" [1146. , 100. , 0. ],\n",
" [ 792. , 83.33333333, 16.66666667],\n",
" [1070. , 100. , 0. ],\n",
" [1087. , 100. , 0. ],\n",
" [1230. , 100. , 0. ],\n",
" [1128. , 100. , 0. ],\n",
" [ 814. , 100. , 0. ],\n",
" [1326. , 100. , 0. ],\n",
" [1298. , 100. , 0. ]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Feature matrix to be standardized: mean reaction time, percentage of correct\n",
"# responses and oer (positional columns 7, 10 and 11 of the dataset).\n",
"# Selecting by name keeps the cell correct if the CSV column order changes.\n",
"feature_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']\n",
"x = dataset[feature_columns].values\n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[-0.07666676, 0.37476584, -0.37476584],\n",
" [ 1.44300705, 0.37476584, -0.37476584],\n",
" [ 0.15394522, 0.37476584, -0.37476584],\n",
" [ 1.36022326, 0.37476584, -0.37476584],\n",
" [ 0.50873288, 0.37476584, -0.37476584],\n",
" [ 0.42003596, 0.37476584, -0.37476584],\n",
" [-1.3893811 , 0.37476584, -0.37476584],\n",
" [-1.60225369, 0.37476584, -0.37476584],\n",
" [-0.90450463, 0.37476584, -0.37476584],\n",
" [-0.46102006, 0.37476584, -0.37476584],\n",
" [-1.3479892 , -1.79887605, 1.79887605],\n",
" [-1.1765085 , 0.37476584, -0.37476584],\n",
" [-0.99911467, 0.37476584, -0.37476584],\n",
" [-0.13579803, -1.79887605, 1.79887605],\n",
" [ 0.16577148, 0.37476584, -0.37476584],\n",
" [ 0.04159579, 0.37476584, -0.37476584],\n",
" [ 1.89240475, 0.37476584, -0.37476584],\n",
" [-0.67389265, 0.37476584, -0.37476584],\n",
" [ 0.10072707, 0.37476584, -0.37476584],\n",
" [ 0.28403403, -1.79887605, 1.79887605],\n",
" [ 0.54421164, 0.37476584, -0.37476584],\n",
" [-1.54903554, -3.97251795, 3.97251795],\n",
" [ 0.09481394, 0.37476584, -0.37476584],\n",
" [ 0.19533711, 0.37476584, -0.37476584],\n",
" [ 1.04091437, 0.37476584, -0.37476584],\n",
" [ 0.43777535, 0.37476584, -0.37476584],\n",
" [-1.41894673, 0.37476584, -0.37476584],\n",
" [ 1.60857462, 0.37476584, -0.37476584],\n",
" [ 1.44300705, 0.37476584, -0.37476584]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# standardizing the data\n",
"from sklearn.preprocessing import StandardScaler\n",
"scaler = StandardScaler()\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# statistics of scaled data; displayed explicitly because a bare expression in\n",
"# the middle of a cell is evaluated and then discarded\n",
"display(pd.DataFrame(new_df).describe())\n",
"\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "b5fc4f60",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 6. , -0.07666676, 0.37476584, -0.37476584],\n",
" [ 6. , 1.44300705, 0.37476584, -0.37476584],\n",
" [ 6. , 0.15394522, 0.37476584, -0.37476584],\n",
" [ 6. , 1.36022326, 0.37476584, -0.37476584],\n",
" [ 6. , 0.50873288, 0.37476584, -0.37476584],\n",
" [ 6. , 0.42003596, 0.37476584, -0.37476584],\n",
" [ 6. , -1.3893811 , 0.37476584, -0.37476584],\n",
" [ 6. , -1.60225369, 0.37476584, -0.37476584],\n",
" [ 6. , -0.90450463, 0.37476584, -0.37476584],\n",
" [ 6. , -0.46102006, 0.37476584, -0.37476584],\n",
" [ 6. , -1.3479892 , -1.79887605, 1.79887605],\n",
" [ 6. , -1.1765085 , 0.37476584, -0.37476584],\n",
" [ 6. , -0.99911467, 0.37476584, -0.37476584],\n",
" [ 6. , -0.13579803, -1.79887605, 1.79887605],\n",
" [ 7. , 0.16577148, 0.37476584, -0.37476584],\n",
" [ 7. , 0.04159579, 0.37476584, -0.37476584],\n",
" [ 7. , 1.89240475, 0.37476584, -0.37476584],\n",
" [ 7. , -0.67389265, 0.37476584, -0.37476584],\n",
" [ 7. , 0.10072707, 0.37476584, -0.37476584],\n",
" [ 7. , 0.28403403, -1.79887605, 1.79887605],\n",
" [ 7. , 0.54421164, 0.37476584, -0.37476584],\n",
" [ 7. , -1.54903554, -3.97251795, 3.97251795],\n",
" [ 7. , 0.09481394, 0.37476584, -0.37476584],\n",
" [ 7. , 0.19533711, 0.37476584, -0.37476584],\n",
" [ 7. , 1.04091437, 0.37476584, -0.37476584],\n",
" [ 7. , 0.43777535, 0.37476584, -0.37476584],\n",
" [ 7. , -1.41894673, 0.37476584, -0.37476584],\n",
" [ 7. , 1.60857462, 0.37476584, -0.37476584],\n",
" [ 7. , 1.44300705, 0.37476584, -0.37476584]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Rebuild the clustering input: child_age as stored in the dataset next to the\n",
"# three standardized columns held in new_df, converted to a NumPy array.\n",
"# NOTE(review): child_age is left unscaled while the other columns are\n",
"# standardized - confirm this is intended.\n",
"scaled_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']\n",
"model_input = dataset[['child_age'] + scaled_columns].copy()\n",
"model_input[scaled_columns] = new_df\n",
"x = model_input.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "58284e31",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Finding the optimal number of clusters using the elbow method\n",
"from sklearn.cluster import KMeans\n",
"\n",
"# Candidate cluster counts; the same range drives both the fits and the x-axis.\n",
"k_values = range(1, 11)\n",
"\n",
"# WCSS (the fitted model's inertia_) for each candidate k, in k_values order.\n",
"wcss_list = []\n",
"for k in k_values:\n",
"    kmeans = KMeans(n_clusters=k, init='k-means++', random_state=42)\n",
"    kmeans.fit(x)\n",
"    wcss_list.append(kmeans.inertia_)\n",
"\n",
"mtp.plot(k_values, wcss_list)\n",
"mtp.title('The Elbow Method Graph')\n",
"mtp.xlabel('Number of clusters(k)')\n",
"mtp.ylabel('wcss_list')\n",
"mtp.show()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "5d1c61bf",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[0 0 0 0 0 0 0 0 0 0 1 0 0 1 0 0 0 0 0 1 0 1 0 0 0 0 0 0 0]\n"
]
}
],
"source": [
"# Fit K-means with two clusters on x and keep the cluster label of every row.\n",
"kmeans = KMeans(n_clusters=2, init='k-means++', random_state=42)\n",
"kmeans.fit(x)\n",
"y_predict = kmeans.labels_\n",
"print(y_predict)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>131</th>\n",
" <td>6</td>\n",
" <td>1041</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>132</th>\n",
" <td>6</td>\n",
" <td>1298</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>133</th>\n",
" <td>6</td>\n",
" <td>1080</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>134</th>\n",
" <td>6</td>\n",
" <td>1284</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>135</th>\n",
" <td>6</td>\n",
" <td>1140</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>136</th>\n",
" <td>6</td>\n",
" <td>1125</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>137</th>\n",
" <td>6</td>\n",
" <td>819</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>138</th>\n",
" <td>6</td>\n",
" <td>783</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>139</th>\n",
" <td>6</td>\n",
" <td>901</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>6</td>\n",
" <td>976</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>141</th>\n",
" <td>6</td>\n",
" <td>826</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>142</th>\n",
" <td>6</td>\n",
" <td>855</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>143</th>\n",
" <td>6</td>\n",
" <td>885</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>144</th>\n",
" <td>6</td>\n",
" <td>1031</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>7</td>\n",
" <td>1082</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>7</td>\n",
" <td>1061</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>7</td>\n",
" <td>1374</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>7</td>\n",
" <td>940</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>7</td>\n",
" <td>1071</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>150</th>\n",
" <td>7</td>\n",
" <td>1102</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>151</th>\n",
" <td>7</td>\n",
" <td>1146</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>7</td>\n",
" <td>792</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>153</th>\n",
" <td>7</td>\n",
" <td>1070</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>7</td>\n",
" <td>1087</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>155</th>\n",
" <td>7</td>\n",
" <td>1230</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>156</th>\n",
" <td>7</td>\n",
" <td>1128</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>157</th>\n",
" <td>7</td>\n",
" <td>814</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>158</th>\n",
" <td>7</td>\n",
" <td>1326</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>159</th>\n",
" <td>7</td>\n",
" <td>1298</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"131 6 1041 100.000000 \n",
"132 6 1298 100.000000 \n",
"133 6 1080 100.000000 \n",
"134 6 1284 100.000000 \n",
"135 6 1140 100.000000 \n",
"136 6 1125 100.000000 \n",
"137 6 819 100.000000 \n",
"138 6 783 100.000000 \n",
"139 6 901 100.000000 \n",
"140 6 976 100.000000 \n",
"141 6 826 91.666667 \n",
"142 6 855 100.000000 \n",
"143 6 885 100.000000 \n",
"144 6 1031 91.666667 \n",
"145 7 1082 100.000000 \n",
"146 7 1061 100.000000 \n",
"147 7 1374 100.000000 \n",
"148 7 940 100.000000 \n",
"149 7 1071 100.000000 \n",
"150 7 1102 91.666667 \n",
"151 7 1146 100.000000 \n",
"152 7 792 83.333333 \n",
"153 7 1070 100.000000 \n",
"154 7 1087 100.000000 \n",
"155 7 1230 100.000000 \n",
"156 7 1128 100.000000 \n",
"157 7 814 100.000000 \n",
"158 7 1326 100.000000 \n",
"159 7 1298 100.000000 \n",
"\n",
" oer clusters \n",
"131 0.000000 0 \n",
"132 0.000000 0 \n",
"133 0.000000 0 \n",
"134 0.000000 0 \n",
"135 0.000000 0 \n",
"136 0.000000 0 \n",
"137 0.000000 0 \n",
"138 0.000000 0 \n",
"139 0.000000 0 \n",
"140 0.000000 0 \n",
"141 8.333333 1 \n",
"142 0.000000 0 \n",
"143 0.000000 0 \n",
"144 8.333333 1 \n",
"145 0.000000 0 \n",
"146 0.000000 0 \n",
"147 0.000000 0 \n",
"148 0.000000 0 \n",
"149 0.000000 0 \n",
"150 8.333333 1 \n",
"151 0.000000 0 \n",
"152 16.666667 1 \n",
"153 0.000000 0 \n",
"154 0.000000 0 \n",
"155 0.000000 0 \n",
"156 0.000000 0 \n",
"157 0.000000 0 \n",
"158 0.000000 0 \n",
"159 0.000000 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Unscaled copy of the four clustering columns with each row's K-means label\n",
"# attached in a new 'clusters' column.\n",
"clustered_columns = ['child_age', 'mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']\n",
"new_df = dataset[clustered_columns].assign(clusters=y_predict)\n",
"display(new_df)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "22e58322",
"metadata": {},
"outputs": [],
"source": [
"# save the model to disk\n",
"import pickle\n",
"filename = 'modelfa2.sav'\n",
"# Use a context manager so the file is flushed and closed even if dump() raises.\n",
"# NOTE(review): only the KMeans model is written here; the StandardScaler fitted\n",
"# earlier is not saved by this cell - confirm consumers can reproduce the scaling.\n",
"with open(filename, 'wb') as model_file:\n",
"    pickle.dump(kmeans, model_file)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "358178a6",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Silhouette Coefficient: 0.628\n",
"Calinski-Harabasz Index: 34.856\n",
"Davies-Bouldin Index: 0.641\n"
]
}
],
"source": [
"from sklearn.metrics import silhouette_score,calinski_harabasz_score,davies_bouldin_score\n",
"\n",
"# Each entry pairs a report template with the scoring function that fills it;\n",
"# every score is computed on the clustering input x and the labels y_predict.\n",
"score_reports = (\n",
"    (\"Silhouette Coefficient: %0.3f\", silhouette_score),\n",
"    (\"Calinski-Harabasz Index: %0.3f\", calinski_harabasz_score),\n",
"    (\"Davies-Bouldin Index: %0.3f\", davies_bouldin_score),\n",
")\n",
"for template, score_fn in score_reports:\n",
"    print(template % score_fn(x, y_predict))"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1 (label 0)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "ba8fef3b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"25"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Number of rows whose cluster label is 0.\n",
"int((new_df[\"clusters\"] == 0).sum())"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "6c5b7397",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>131</th>\n",
" <td>6</td>\n",
" <td>1041</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>132</th>\n",
" <td>6</td>\n",
" <td>1298</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>133</th>\n",
" <td>6</td>\n",
" <td>1080</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>134</th>\n",
" <td>6</td>\n",
" <td>1284</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>135</th>\n",
" <td>6</td>\n",
" <td>1140</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>136</th>\n",
" <td>6</td>\n",
" <td>1125</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>137</th>\n",
" <td>6</td>\n",
" <td>819</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>138</th>\n",
" <td>6</td>\n",
" <td>783</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>139</th>\n",
" <td>6</td>\n",
" <td>901</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>6</td>\n",
" <td>976</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>142</th>\n",
" <td>6</td>\n",
" <td>855</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>143</th>\n",
" <td>6</td>\n",
" <td>885</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>7</td>\n",
" <td>1082</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>7</td>\n",
" <td>1061</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>7</td>\n",
" <td>1374</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>7</td>\n",
" <td>940</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>7</td>\n",
" <td>1071</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>151</th>\n",
" <td>7</td>\n",
" <td>1146</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>153</th>\n",
" <td>7</td>\n",
" <td>1070</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>154</th>\n",
" <td>7</td>\n",
" <td>1087</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>155</th>\n",
" <td>7</td>\n",
" <td>1230</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>156</th>\n",
" <td>7</td>\n",
" <td>1128</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>157</th>\n",
" <td>7</td>\n",
" <td>814</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>158</th>\n",
" <td>7</td>\n",
" <td>1326</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>159</th>\n",
" <td>7</td>\n",
" <td>1298</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"131 6 1041 100.0 0.0 \n",
"132 6 1298 100.0 0.0 \n",
"133 6 1080 100.0 0.0 \n",
"134 6 1284 100.0 0.0 \n",
"135 6 1140 100.0 0.0 \n",
"136 6 1125 100.0 0.0 \n",
"137 6 819 100.0 0.0 \n",
"138 6 783 100.0 0.0 \n",
"139 6 901 100.0 0.0 \n",
"140 6 976 100.0 0.0 \n",
"142 6 855 100.0 0.0 \n",
"143 6 885 100.0 0.0 \n",
"145 7 1082 100.0 0.0 \n",
"146 7 1061 100.0 0.0 \n",
"147 7 1374 100.0 0.0 \n",
"148 7 940 100.0 0.0 \n",
"149 7 1071 100.0 0.0 \n",
"151 7 1146 100.0 0.0 \n",
"153 7 1070 100.0 0.0 \n",
"154 7 1087 100.0 0.0 \n",
"155 7 1230 100.0 0.0 \n",
"156 7 1128 100.0 0.0 \n",
"157 7 814 100.0 0.0 \n",
"158 7 1326 100.0 0.0 \n",
"159 7 1298 100.0 0.0 \n",
"\n",
" clusters \n",
"131 0 \n",
"132 0 \n",
"133 0 \n",
"134 0 \n",
"135 0 \n",
"136 0 \n",
"137 0 \n",
"138 0 \n",
"139 0 \n",
"140 0 \n",
"142 0 \n",
"143 0 \n",
"145 0 \n",
"146 0 \n",
"147 0 \n",
"148 0 \n",
"149 0 \n",
"151 0 \n",
"153 0 \n",
"154 0 \n",
"155 0 \n",
"156 0 \n",
"157 0 \n",
"158 0 \n",
"159 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Rows of new_df whose cluster label is 0.\n",
"in_cluster_0 = new_df[\"clusters\"].eq(0)\n",
"cluster_0 = new_df.loc[in_cluster_0]\n",
"display(cluster_0)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "849d9447",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 783\n",
"mean_reaction_time max - 1374\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n"
]
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"\n",
"# Print the min and max of each clustering column within cluster_0, one group\n",
"# per column, with a blank line between groups (none after the last one).\n",
"summary_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']\n",
"for position, column in enumerate(summary_columns):\n",
"    if position > 0:\n",
"        print()\n",
"    minVal = cluster_0[column].min()\n",
"    maxVal = cluster_0[column].max()\n",
"    print(column + \" min - \", minVal)\n",
"    print(column + \" max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "f9ed816e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"4"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 1])"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "e3eeb500",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>141</th>\n",
" <td>6</td>\n",
" <td>826</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>144</th>\n",
" <td>6</td>\n",
" <td>1031</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>150</th>\n",
" <td>7</td>\n",
" <td>1102</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>152</th>\n",
" <td>7</td>\n",
" <td>792</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"141 6 826 91.666667 \n",
"144 6 1031 91.666667 \n",
"150 7 1102 91.666667 \n",
"152 7 792 83.333333 \n",
"\n",
" oer clusters \n",
"141 8.333333 1 \n",
"144 8.333333 1 \n",
"150 8.333333 1 \n",
"152 16.666667 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"display(cluster_1)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "2ab1bc45",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 792\n",
"mean_reaction_time max - 1102\n",
"\n",
"percentage_no_of_correct_responses min - 83.33333333\n",
"percentage_no_of_correct_responses max - 91.66666667\n",
"\n",
"oer min - 8.333333333\n",
"oer max - 16.66666667\n"
]
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"\n",
"maxVal = cluster_1['mean_reaction_time'].max()\n",
"minVal = cluster_1['mean_reaction_time'].min()\n",
"\n",
"print(\"mean_reaction_time min - \", minVal)\n",
"print(\"mean_reaction_time max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_1['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['oer'].max()\n",
"minVal = cluster_1['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>80</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1448</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>81</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1331</td>\n",
" <td>78000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>82</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1426</td>\n",
" <td>74500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>83</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1632</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>83</th>\n",
" <td>84</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1340</td>\n",
" <td>72000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>85</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1564</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>86</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1366</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>86</th>\n",
" <td>87</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1291</td>\n",
" <td>74500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>87</th>\n",
" <td>88</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2032</td>\n",
" <td>71500</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>89</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1789</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>90</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1680</td>\n",
" <td>73500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>90</th>\n",
" <td>91</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1317</td>\n",
" <td>67500</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>91</th>\n",
" <td>92</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1040</td>\n",
" <td>70500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>92</th>\n",
" <td>93</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1142</td>\n",
" <td>75500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>93</th>\n",
" <td>94</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1168</td>\n",
" <td>75000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>94</th>\n",
" <td>95</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1150</td>\n",
" <td>77000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>95</th>\n",
" <td>96</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1270</td>\n",
" <td>76000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>97</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1457</td>\n",
" <td>73000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>97</th>\n",
" <td>98</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1180</td>\n",
" <td>72500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>98</th>\n",
" <td>99</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1261</td>\n",
" <td>73500</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>99</th>\n",
" <td>100</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>1234</td>\n",
" <td>71500</td>\n",
" <td>No</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>100</th>\n",
" <td>101</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1165</td>\n",
" <td>73000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>101</th>\n",
" <td>102</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1238</td>\n",
" <td>71000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>102</th>\n",
" <td>103</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>9</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1830</td>\n",
" <td>71000</td>\n",
" <td>No</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>104</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1657</td>\n",
" <td>78000</td>\n",
" <td>No</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>105</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>1817</td>\n",
" <td>74000</td>\n",
" <td>No</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>106</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1600</td>\n",
" <td>84500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>107</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1396</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>108</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1380</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>109</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1350</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>110</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1310</td>\n",
" <td>87000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>111</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1462</td>\n",
" <td>94000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>112</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1069</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>113</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1221</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>114</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1775</td>\n",
" <td>90000</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>115</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1852</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>116</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1598</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>117</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1785</td>\n",
" <td>86000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>118</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1628</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>119</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1758</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>120</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1215</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>121</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1134</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>122</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>11</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1364</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>123</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1499</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>124</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1998</td>\n",
" <td>88000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>125</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1916</td>\n",
" <td>85500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>126</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1152</td>\n",
" <td>89500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>127</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1086</td>\n",
" <td>92500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>128</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1207</td>\n",
" <td>86500</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>129</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1047</td>\n",
" <td>92000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>130</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>10</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1162</td>\n",
" <td>88500</td>\n",
" <td>No</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>131</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>12</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1278</td>\n",
" <td>89000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Focused</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"79 80 1 4 10 10 \n",
"80 81 1 4 10 10 \n",
"81 82 1 4 10 10 \n",
"82 83 2 4 10 10 \n",
"83 84 2 4 10 9 \n",
"84 85 2 4 10 10 \n",
"85 86 2 4 10 8 \n",
"86 87 2 4 10 10 \n",
"87 88 2 4 10 8 \n",
"88 89 2 4 10 9 \n",
"89 90 2 4 10 10 \n",
"90 91 1 4 10 9 \n",
"91 92 1 4 10 10 \n",
"92 93 1 4 10 10 \n",
"93 94 1 4 10 10 \n",
"94 95 1 4 10 10 \n",
"95 96 1 4 10 10 \n",
"96 97 1 4 10 9 \n",
"97 98 1 4 10 10 \n",
"98 99 1 4 10 9 \n",
"99 100 1 4 10 7 \n",
"100 101 1 4 10 10 \n",
"101 102 1 4 10 10 \n",
"102 103 1 4 10 9 \n",
"103 104 1 4 10 8 \n",
"104 105 1 4 10 7 \n",
"105 106 2 5 12 11 \n",
"106 107 2 5 12 11 \n",
"107 108 2 5 12 12 \n",
"108 109 2 5 12 12 \n",
"109 110 2 5 12 12 \n",
"110 111 2 5 12 12 \n",
"111 112 1 5 12 12 \n",
"112 113 1 5 12 12 \n",
"113 114 1 5 12 10 \n",
"114 115 2 5 12 10 \n",
"115 116 2 5 12 11 \n",
"116 117 2 5 12 12 \n",
"117 118 2 5 12 12 \n",
"118 119 2 5 12 12 \n",
"119 120 2 5 12 12 \n",
"120 121 2 5 12 12 \n",
"121 122 2 5 12 11 \n",
"122 123 2 5 12 12 \n",
"123 124 2 5 12 12 \n",
"124 125 2 5 12 10 \n",
"125 126 2 5 12 12 \n",
"126 127 2 5 12 12 \n",
"127 128 2 5 12 12 \n",
"128 129 2 5 12 12 \n",
"129 130 2 5 12 10 \n",
"130 131 2 5 12 12 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"79 0 0 1448 74000 \n",
"80 0 0 1331 78000 \n",
"81 0 0 1426 74500 \n",
"82 0 0 1632 76000 \n",
"83 0 1 1340 72000 \n",
"84 0 0 1564 76000 \n",
"85 0 2 1366 76000 \n",
"86 0 0 1291 74500 \n",
"87 0 2 2032 71500 \n",
"88 0 1 1789 74000 \n",
"89 0 0 1680 73500 \n",
"90 0 1 1317 67500 \n",
"91 0 0 1040 70500 \n",
"92 0 0 1142 75500 \n",
"93 0 0 1168 75000 \n",
"94 0 0 1150 77000 \n",
"95 0 0 1270 76000 \n",
"96 0 1 1457 73000 \n",
"97 0 0 1180 72500 \n",
"98 0 1 1261 73500 \n",
"99 0 3 1234 71500 \n",
"100 0 0 1165 73000 \n",
"101 0 0 1238 71000 \n",
"102 0 1 1830 71000 \n",
"103 0 2 1657 78000 \n",
"104 0 3 1817 74000 \n",
"105 0 1 1600 84500 \n",
"106 0 1 1396 86500 \n",
"107 0 0 1380 89000 \n",
"108 0 0 1350 90000 \n",
"109 0 0 1310 87000 \n",
"110 0 0 1462 94000 \n",
"111 0 0 1069 89000 \n",
"112 0 0 1221 92000 \n",
"113 0 2 1775 90000 \n",
"114 0 2 1852 89500 \n",
"115 0 1 1598 92000 \n",
"116 0 0 1785 86000 \n",
"117 0 0 1628 92000 \n",
"118 0 0 1758 86500 \n",
"119 0 0 1215 92000 \n",
"120 0 0 1134 89000 \n",
"121 0 1 1364 89000 \n",
"122 0 0 1499 89000 \n",
"123 0 0 1998 88000 \n",
"124 0 2 1916 85500 \n",
"125 0 0 1152 89500 \n",
"126 0 0 1086 92500 \n",
"127 0 0 1207 86500 \n",
"128 0 0 1047 92000 \n",
"129 0 2 1162 88500 \n",
"130 0 0 1278 89000 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer game \n",
"79 No 100.000000 0.000000 0.0 Focused \n",
"80 No 100.000000 0.000000 0.0 Focused \n",
"81 No 100.000000 0.000000 0.0 Focused \n",
"82 No 100.000000 0.000000 0.0 Focused \n",
"83 No 90.000000 10.000000 0.0 Focused \n",
"84 No 100.000000 0.000000 0.0 Focused \n",
"85 No 80.000000 20.000000 0.0 Focused \n",
"86 No 100.000000 0.000000 0.0 Focused \n",
"87 No 80.000000 20.000000 0.0 Focused \n",
"88 No 90.000000 10.000000 0.0 Focused \n",
"89 No 100.000000 0.000000 0.0 Focused \n",
"90 No 90.000000 10.000000 0.0 Focused \n",
"91 No 100.000000 0.000000 0.0 Focused \n",
"92 No 100.000000 0.000000 0.0 Focused \n",
"93 No 100.000000 0.000000 0.0 Focused \n",
"94 No 100.000000 0.000000 0.0 Focused \n",
"95 No 100.000000 0.000000 0.0 Focused \n",
"96 No 90.000000 10.000000 0.0 Focused \n",
"97 No 100.000000 0.000000 0.0 Focused \n",
"98 No 90.000000 10.000000 0.0 Focused \n",
"99 No 70.000000 30.000000 0.0 Focused \n",
"100 No 100.000000 0.000000 0.0 Focused \n",
"101 No 100.000000 0.000000 0.0 Focused \n",
"102 No 90.000000 10.000000 0.0 Focused \n",
"103 No 80.000000 20.000000 0.0 Focused \n",
"104 No 70.000000 30.000000 0.0 Focused \n",
"105 No 91.666667 8.333333 0.0 Focused \n",
"106 No 91.666667 8.333333 0.0 Focused \n",
"107 No 100.000000 0.000000 0.0 Focused \n",
"108 No 100.000000 0.000000 0.0 Focused \n",
"109 No 100.000000 0.000000 0.0 Focused \n",
"110 No 100.000000 0.000000 0.0 Focused \n",
"111 No 100.000000 0.000000 0.0 Focused \n",
"112 No 100.000000 0.000000 0.0 Focused \n",
"113 No 83.333333 16.666667 0.0 Focused \n",
"114 No 83.333333 16.666667 0.0 Focused \n",
"115 No 91.666667 8.333333 0.0 Focused \n",
"116 No 100.000000 0.000000 0.0 Focused \n",
"117 No 100.000000 0.000000 0.0 Focused \n",
"118 No 100.000000 0.000000 0.0 Focused \n",
"119 No 100.000000 0.000000 0.0 Focused \n",
"120 No 100.000000 0.000000 0.0 Focused \n",
"121 No 91.666667 8.333333 0.0 Focused \n",
"122 No 100.000000 0.000000 0.0 Focused \n",
"123 No 100.000000 0.000000 0.0 Focused \n",
"124 No 83.333333 16.666667 0.0 Focused \n",
"125 No 100.000000 0.000000 0.0 Focused \n",
"126 No 100.000000 0.000000 0.0 Focused \n",
"127 No 100.000000 0.000000 0.0 Focused \n",
"128 No 100.000000 0.000000 0.0 Focused \n",
"129 No 83.333333 16.666667 0.0 Focused \n",
"130 No 100.000000 0.000000 0.0 Focused "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Importing the dataset \n",
"dataset = pd.read_csv('data.csv') \n",
"dataset.drop(dataset.index[dataset['game'] == 'Alternating'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Sustained'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Selective'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Divided'], inplace = True)\n",
"\n",
"dataset.drop(dataset.index[dataset['child_age'] == 6], inplace = True)\n",
"dataset.drop(dataset.index[dataset['child_age'] == 7], inplace = True)\n",
"\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[1448. , 100. , 0. ],\n",
" [1331. , 100. , 0. ],\n",
" [1426. , 100. , 0. ],\n",
" [1632. , 100. , 0. ],\n",
" [1340. , 90. , 10. ],\n",
" [1564. , 100. , 0. ],\n",
" [1366. , 80. , 20. ],\n",
" [1291. , 100. , 0. ],\n",
" [2032. , 80. , 20. ],\n",
" [1789. , 90. , 10. ],\n",
" [1680. , 100. , 0. ],\n",
" [1317. , 90. , 10. ],\n",
" [1040. , 100. , 0. ],\n",
" [1142. , 100. , 0. ],\n",
" [1168. , 100. , 0. ],\n",
" [1150. , 100. , 0. ],\n",
" [1270. , 100. , 0. ],\n",
" [1457. , 90. , 10. ],\n",
" [1180. , 100. , 0. ],\n",
" [1261. , 90. , 10. ],\n",
" [1234. , 70. , 30. ],\n",
" [1165. , 100. , 0. ],\n",
" [1238. , 100. , 0. ],\n",
" [1830. , 90. , 10. ],\n",
" [1657. , 80. , 20. ],\n",
" [1817. , 70. , 30. ],\n",
" [1600. , 91.66666667, 8.33333333],\n",
" [1396. , 91.66666667, 8.33333333],\n",
" [1380. , 100. , 0. ],\n",
" [1350. , 100. , 0. ],\n",
" [1310. , 100. , 0. ],\n",
" [1462. , 100. , 0. ],\n",
" [1069. , 100. , 0. ],\n",
" [1221. , 100. , 0. ],\n",
" [1775. , 83.33333333, 16.66666667],\n",
" [1852. , 83.33333333, 16.66666667],\n",
" [1598. , 91.66666667, 8.33333333],\n",
" [1785. , 100. , 0. ],\n",
" [1628. , 100. , 0. ],\n",
" [1758. , 100. , 0. ],\n",
" [1215. , 100. , 0. ],\n",
" [1134. , 100. , 0. ],\n",
" [1364. , 91.66666667, 8.33333333],\n",
" [1499. , 100. , 0. ],\n",
" [1998. , 100. , 0. ],\n",
" [1916. , 83.33333333, 16.66666667],\n",
" [1152. , 100. , 0. ],\n",
" [1086. , 100. , 0. ],\n",
" [1207. , 100. , 0. ],\n",
" [1047. , 100. , 0. ],\n",
" [1162. , 83.33333333, 16.66666667],\n",
" [1278. , 100. , 0. ]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# extracting only 11-comission & 12-omission\n",
"x = dataset.iloc[:, [7, 10, 11]].values \n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 0.08876077, 0.65810029, -0.65810029],\n",
" [-0.35063754, 0.65810029, -0.65810029],\n",
" [ 0.00613887, 0.65810029, -0.65810029],\n",
" [ 0.77978033, 0.65810029, -0.65810029],\n",
" [-0.31683767, -0.56408597, 0.56408597],\n",
" [ 0.52440354, 0.65810029, -0.65810029],\n",
" [-0.2191936 , -1.78627223, 1.78627223],\n",
" [-0.50085918, 0.65810029, -0.65810029],\n",
" [ 2.28199678, -1.78627223, 1.78627223],\n",
" [ 1.36940029, -0.56408597, 0.56408597],\n",
" [ 0.96004631, 0.65810029, -0.65810029],\n",
" [-0.40321512, -0.56408597, 0.56408597],\n",
" [-1.4435 , 0.65810029, -0.65810029],\n",
" [-1.06043481, 0.65810029, -0.65810029],\n",
" [-0.96279074, 0.65810029, -0.65810029],\n",
" [-1.03039048, 0.65810029, -0.65810029],\n",
" [-0.57972555, 0.65810029, -0.65810029],\n",
" [ 0.12256064, -0.56408597, 0.56408597],\n",
" [-0.91772425, 0.65810029, -0.65810029],\n",
" [-0.61352542, -0.56408597, 0.56408597],\n",
" [-0.71492503, -3.00845849, 3.00845849],\n",
" [-0.97405736, 0.65810029, -0.65810029],\n",
" [-0.69990286, 0.65810029, -0.65810029],\n",
" [ 1.52337747, -0.56408597, 0.56408597],\n",
" [ 0.87366886, -1.78627223, 1.78627223],\n",
" [ 1.47455544, -3.00845849, 3.00845849],\n",
" [ 0.65960302, -0.36038826, 0.36038826],\n",
" [-0.10652737, -0.36038826, 0.36038826],\n",
" [-0.16661603, 0.65810029, -0.65810029],\n",
" [-0.27928226, 0.65810029, -0.65810029],\n",
" [-0.4295039 , 0.65810029, -0.65810029],\n",
" [ 0.14133835, 0.65810029, -0.65810029],\n",
" [-1.33458931, 0.65810029, -0.65810029],\n",
" [-0.76374706, 0.65810029, -0.65810029],\n",
" [ 1.31682271, -1.37887681, 1.37887681],\n",
" [ 1.60599938, -1.37887681, 1.37887681],\n",
" [ 0.65209194, -0.36038826, 0.36038826],\n",
" [ 1.35437812, 0.65810029, -0.65810029],\n",
" [ 0.76475817, 0.65810029, -0.65810029],\n",
" [ 1.25297851, 0.65810029, -0.65810029],\n",
" [-0.78628031, 0.65810029, -0.65810029],\n",
" [-1.09047914, 0.65810029, -0.65810029],\n",
" [-0.22670468, -0.36038826, 0.36038826],\n",
" [ 0.28029337, 0.65810029, -0.65810029],\n",
" [ 2.15430838, 0.65810029, -0.65810029],\n",
" [ 1.84635401, -1.37887681, 1.37887681],\n",
" [-1.0228794 , 0.65810029, -0.65810029],\n",
" [-1.27074511, 0.65810029, -0.65810029],\n",
" [-0.81632464, 0.65810029, -0.65810029],\n",
" [-1.41721122, 0.65810029, -0.65810029],\n",
" [-0.98532399, -1.37887681, 1.37887681],\n",
" [-0.54968122, 0.65810029, -0.65810029]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# standardizing the data\n",
"from sklearn.preprocessing import StandardScaler\n",
"scaler = StandardScaler()\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# statistics of scaled data\n",
"# display() is required here: a bare expression is only rendered when it is the\n",
"# last statement of a cell, so this summary was previously computed and discarded.\n",
"display(pd.DataFrame(new_df).describe())\n",
"\n",
"# the scaled values themselves (a NumPy array, despite the `new_df` name)\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "b5fc4f60",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 4. , 0.08876077, 0.65810029, -0.65810029],\n",
" [ 4. , -0.35063754, 0.65810029, -0.65810029],\n",
" [ 4. , 0.00613887, 0.65810029, -0.65810029],\n",
" [ 4. , 0.77978033, 0.65810029, -0.65810029],\n",
" [ 4. , -0.31683767, -0.56408597, 0.56408597],\n",
" [ 4. , 0.52440354, 0.65810029, -0.65810029],\n",
" [ 4. , -0.2191936 , -1.78627223, 1.78627223],\n",
" [ 4. , -0.50085918, 0.65810029, -0.65810029],\n",
" [ 4. , 2.28199678, -1.78627223, 1.78627223],\n",
" [ 4. , 1.36940029, -0.56408597, 0.56408597],\n",
" [ 4. , 0.96004631, 0.65810029, -0.65810029],\n",
" [ 4. , -0.40321512, -0.56408597, 0.56408597],\n",
" [ 4. , -1.4435 , 0.65810029, -0.65810029],\n",
" [ 4. , -1.06043481, 0.65810029, -0.65810029],\n",
" [ 4. , -0.96279074, 0.65810029, -0.65810029],\n",
" [ 4. , -1.03039048, 0.65810029, -0.65810029],\n",
" [ 4. , -0.57972555, 0.65810029, -0.65810029],\n",
" [ 4. , 0.12256064, -0.56408597, 0.56408597],\n",
" [ 4. , -0.91772425, 0.65810029, -0.65810029],\n",
" [ 4. , -0.61352542, -0.56408597, 0.56408597],\n",
" [ 4. , -0.71492503, -3.00845849, 3.00845849],\n",
" [ 4. , -0.97405736, 0.65810029, -0.65810029],\n",
" [ 4. , -0.69990286, 0.65810029, -0.65810029],\n",
" [ 4. , 1.52337747, -0.56408597, 0.56408597],\n",
" [ 4. , 0.87366886, -1.78627223, 1.78627223],\n",
" [ 4. , 1.47455544, -3.00845849, 3.00845849],\n",
" [ 5. , 0.65960302, -0.36038826, 0.36038826],\n",
" [ 5. , -0.10652737, -0.36038826, 0.36038826],\n",
" [ 5. , -0.16661603, 0.65810029, -0.65810029],\n",
" [ 5. , -0.27928226, 0.65810029, -0.65810029],\n",
" [ 5. , -0.4295039 , 0.65810029, -0.65810029],\n",
" [ 5. , 0.14133835, 0.65810029, -0.65810029],\n",
" [ 5. , -1.33458931, 0.65810029, -0.65810029],\n",
" [ 5. , -0.76374706, 0.65810029, -0.65810029],\n",
" [ 5. , 1.31682271, -1.37887681, 1.37887681],\n",
" [ 5. , 1.60599938, -1.37887681, 1.37887681],\n",
" [ 5. , 0.65209194, -0.36038826, 0.36038826],\n",
" [ 5. , 1.35437812, 0.65810029, -0.65810029],\n",
" [ 5. , 0.76475817, 0.65810029, -0.65810029],\n",
" [ 5. , 1.25297851, 0.65810029, -0.65810029],\n",
" [ 5. , -0.78628031, 0.65810029, -0.65810029],\n",
" [ 5. , -1.09047914, 0.65810029, -0.65810029],\n",
" [ 5. , -0.22670468, -0.36038826, 0.36038826],\n",
" [ 5. , 0.28029337, 0.65810029, -0.65810029],\n",
" [ 5. , 2.15430838, 0.65810029, -0.65810029],\n",
" [ 5. , 1.84635401, -1.37887681, 1.37887681],\n",
" [ 5. , -1.0228794 , 0.65810029, -0.65810029],\n",
" [ 5. , -1.27074511, 0.65810029, -0.65810029],\n",
" [ 5. , -0.81632464, 0.65810029, -0.65810029],\n",
" [ 5. , -1.41721122, 0.65810029, -0.65810029],\n",
" [ 5. , -0.98532399, -1.37887681, 1.37887681],\n",
" [ 5. , -0.54968122, 0.65810029, -0.65810029]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Rebuild the clustering input from columns 2, 7, 10 and 11 of `dataset`.\n",
"# Only the three columns named below are overwritten with the standardized\n",
"# values held in `new_df`; child_age keeps its raw values.\n",
"# NOTE(review): confirm that leaving child_age unscaled is intended - it sits on a\n",
"# different scale from the standardized columns that are clustered with it.\n",
"scaled_columns = ['mean_reaction_time', 'percentage_no_of_correct_responses', 'oer']\n",
"features = dataset.iloc[:, [2, 7, 10, 11]].copy()\n",
"features[scaled_columns] = new_df\n",
"\n",
"# later cells pass `x` to the clustering model and to the validation metrics\n",
"x = features.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "5d1c61bf",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.cluster import MeanShift\n",
"\n",
"# define the model (no bandwidth given, so scikit-learn estimates it from the data)\n",
"model = MeanShift()\n",
"# fit model and predict clusters: one integer label per row of x\n",
"yhat = model.fit_predict(x)\n",
"# retrieve unique clusters\n",
"clusters = unique(yhat)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "3343196f",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[[ 4.53125 -0.47609609 0.59444476 -0.59444476]\n",
" [ 4.4 0.26602231 -0.48260688 0.48260688]\n",
" [ 4.42857143 1.54537422 -1.26247812 1.26247812]\n",
" [ 4.33333333 -0.11028291 -1.65047376 1.65047376]\n",
" [ 4. 1.47455544 -3.00845849 3.00845849]\n",
" [ 4. -0.71492503 -3.00845849 3.00845849]]\n",
"Estimated clusters: 6\n"
]
}
],
"source": [
"# Reuse the estimator fitted in the previous cell instead of fitting a second\n",
"# MeanShift on the same `x`, so the centres printed here are guaranteed to come\n",
"# from the same fit that produced `yhat`.\n",
"ms = model\n",
"labels = ms.labels_\n",
"cluster_centers = ms.cluster_centers_\n",
"print(cluster_centers)\n",
"n_clusters_ = len(nm.unique(labels))\n",
"print(\"Estimated clusters:\", n_clusters_)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>4</td>\n",
" <td>1448</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>4</td>\n",
" <td>1331</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>4</td>\n",
" <td>1426</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>4</td>\n",
" <td>1632</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>83</th>\n",
" <td>4</td>\n",
" <td>1340</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>4</td>\n",
" <td>1564</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>4</td>\n",
" <td>1366</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>86</th>\n",
" <td>4</td>\n",
" <td>1291</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>87</th>\n",
" <td>4</td>\n",
" <td>2032</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>4</td>\n",
" <td>1789</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>4</td>\n",
" <td>1680</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>90</th>\n",
" <td>4</td>\n",
" <td>1317</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>91</th>\n",
" <td>4</td>\n",
" <td>1040</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>92</th>\n",
" <td>4</td>\n",
" <td>1142</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>93</th>\n",
" <td>4</td>\n",
" <td>1168</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>94</th>\n",
" <td>4</td>\n",
" <td>1150</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>95</th>\n",
" <td>4</td>\n",
" <td>1270</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>4</td>\n",
" <td>1457</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>97</th>\n",
" <td>4</td>\n",
" <td>1180</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>98</th>\n",
" <td>4</td>\n",
" <td>1261</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>99</th>\n",
" <td>4</td>\n",
" <td>1234</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>100</th>\n",
" <td>4</td>\n",
" <td>1165</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>101</th>\n",
" <td>4</td>\n",
" <td>1238</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>102</th>\n",
" <td>4</td>\n",
" <td>1830</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>103</th>\n",
" <td>4</td>\n",
" <td>1657</td>\n",
" <td>80.000000</td>\n",
" <td>20.000000</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>4</td>\n",
" <td>1817</td>\n",
" <td>70.000000</td>\n",
" <td>30.000000</td>\n",
" <td>4</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>5</td>\n",
" <td>1600</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>5</td>\n",
" <td>1396</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>5</td>\n",
" <td>1380</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>5</td>\n",
" <td>1350</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>5</td>\n",
" <td>1310</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>5</td>\n",
" <td>1462</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>5</td>\n",
" <td>1069</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>5</td>\n",
" <td>1221</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>5</td>\n",
" <td>1775</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>5</td>\n",
" <td>1852</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>5</td>\n",
" <td>1598</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>5</td>\n",
" <td>1785</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>5</td>\n",
" <td>1628</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>5</td>\n",
" <td>1758</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>5</td>\n",
" <td>1215</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>5</td>\n",
" <td>1134</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>5</td>\n",
" <td>1364</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>5</td>\n",
" <td>1499</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>5</td>\n",
" <td>1998</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>5</td>\n",
" <td>1916</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>5</td>\n",
" <td>1152</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>5</td>\n",
" <td>1086</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>5</td>\n",
" <td>1207</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>5</td>\n",
" <td>1047</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>5</td>\n",
" <td>1162</td>\n",
" <td>83.333333</td>\n",
" <td>16.666667</td>\n",
" <td>3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>5</td>\n",
" <td>1278</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"79 4 1448 100.000000 \n",
"80 4 1331 100.000000 \n",
"81 4 1426 100.000000 \n",
"82 4 1632 100.000000 \n",
"83 4 1340 90.000000 \n",
"84 4 1564 100.000000 \n",
"85 4 1366 80.000000 \n",
"86 4 1291 100.000000 \n",
"87 4 2032 80.000000 \n",
"88 4 1789 90.000000 \n",
"89 4 1680 100.000000 \n",
"90 4 1317 90.000000 \n",
"91 4 1040 100.000000 \n",
"92 4 1142 100.000000 \n",
"93 4 1168 100.000000 \n",
"94 4 1150 100.000000 \n",
"95 4 1270 100.000000 \n",
"96 4 1457 90.000000 \n",
"97 4 1180 100.000000 \n",
"98 4 1261 90.000000 \n",
"99 4 1234 70.000000 \n",
"100 4 1165 100.000000 \n",
"101 4 1238 100.000000 \n",
"102 4 1830 90.000000 \n",
"103 4 1657 80.000000 \n",
"104 4 1817 70.000000 \n",
"105 5 1600 91.666667 \n",
"106 5 1396 91.666667 \n",
"107 5 1380 100.000000 \n",
"108 5 1350 100.000000 \n",
"109 5 1310 100.000000 \n",
"110 5 1462 100.000000 \n",
"111 5 1069 100.000000 \n",
"112 5 1221 100.000000 \n",
"113 5 1775 83.333333 \n",
"114 5 1852 83.333333 \n",
"115 5 1598 91.666667 \n",
"116 5 1785 100.000000 \n",
"117 5 1628 100.000000 \n",
"118 5 1758 100.000000 \n",
"119 5 1215 100.000000 \n",
"120 5 1134 100.000000 \n",
"121 5 1364 91.666667 \n",
"122 5 1499 100.000000 \n",
"123 5 1998 100.000000 \n",
"124 5 1916 83.333333 \n",
"125 5 1152 100.000000 \n",
"126 5 1086 100.000000 \n",
"127 5 1207 100.000000 \n",
"128 5 1047 100.000000 \n",
"129 5 1162 83.333333 \n",
"130 5 1278 100.000000 \n",
"\n",
" oer clusters \n",
"79 0.000000 0 \n",
"80 0.000000 0 \n",
"81 0.000000 0 \n",
"82 0.000000 0 \n",
"83 10.000000 1 \n",
"84 0.000000 0 \n",
"85 20.000000 3 \n",
"86 0.000000 0 \n",
"87 20.000000 2 \n",
"88 10.000000 2 \n",
"89 0.000000 0 \n",
"90 10.000000 1 \n",
"91 0.000000 0 \n",
"92 0.000000 0 \n",
"93 0.000000 0 \n",
"94 0.000000 0 \n",
"95 0.000000 0 \n",
"96 10.000000 1 \n",
"97 0.000000 0 \n",
"98 10.000000 1 \n",
"99 30.000000 5 \n",
"100 0.000000 0 \n",
"101 0.000000 0 \n",
"102 10.000000 2 \n",
"103 20.000000 3 \n",
"104 30.000000 4 \n",
"105 8.333333 1 \n",
"106 8.333333 1 \n",
"107 0.000000 0 \n",
"108 0.000000 0 \n",
"109 0.000000 0 \n",
"110 0.000000 0 \n",
"111 0.000000 0 \n",
"112 0.000000 0 \n",
"113 16.666667 2 \n",
"114 16.666667 2 \n",
"115 8.333333 1 \n",
"116 0.000000 0 \n",
"117 0.000000 0 \n",
"118 0.000000 0 \n",
"119 0.000000 0 \n",
"120 0.000000 0 \n",
"121 8.333333 1 \n",
"122 0.000000 0 \n",
"123 0.000000 1 \n",
"124 16.666667 2 \n",
"125 0.000000 0 \n",
"126 0.000000 0 \n",
"127 0.000000 0 \n",
"128 0.000000 0 \n",
"129 16.666667 3 \n",
"130 0.000000 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Attach the cluster label of every row to the unscaled feature columns\n",
"# (selected by position: 2, 7, 10, 11) so clusters can be read in original units.\n",
"new_df = dataset.iloc[:, [2, 7, 10, 11]].assign(clusters=yhat)\n",
"display(new_df)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "50a9adbb",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Silhouette Coefficient: 0.361\n",
"Calinski-Harabasz Index: 25.252\n",
"Davies-Bouldin Index: 0.833\n"
]
}
],
"source": [
"from sklearn.metrics import (\n",
"    calinski_harabasz_score,\n",
"    davies_bouldin_score,\n",
"    silhouette_score,\n",
")\n",
"\n",
"# Internal validation scores for the labels in yhat, computed on the matrix x.\n",
"# Each entry pairs the report line with the function that produces its value.\n",
"cluster_quality_metrics = [\n",
"    (\"Silhouette Coefficient: %0.3f\", silhouette_score),\n",
"    (\"Calinski-Harabasz Index: %0.3f\", calinski_harabasz_score),\n",
"    (\"Davies-Bouldin Index: %0.3f\", davies_bouldin_score),\n",
"]\n",
"for report_line, score_fn in cluster_quality_metrics:\n",
"    print(report_line % score_fn(x, yhat))"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1 (MeanShift label 0)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "ba8fef3b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"32"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# number of rows assigned to cluster label 0\n",
"new_df.loc[new_df[\"clusters\"] == 0].shape[0]"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "6c5b7397",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>79</th>\n",
" <td>4</td>\n",
" <td>1448</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>80</th>\n",
" <td>4</td>\n",
" <td>1331</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>81</th>\n",
" <td>4</td>\n",
" <td>1426</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>4</td>\n",
" <td>1632</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>4</td>\n",
" <td>1564</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>86</th>\n",
" <td>4</td>\n",
" <td>1291</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>89</th>\n",
" <td>4</td>\n",
" <td>1680</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>91</th>\n",
" <td>4</td>\n",
" <td>1040</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>92</th>\n",
" <td>4</td>\n",
" <td>1142</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>93</th>\n",
" <td>4</td>\n",
" <td>1168</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>94</th>\n",
" <td>4</td>\n",
" <td>1150</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>95</th>\n",
" <td>4</td>\n",
" <td>1270</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>97</th>\n",
" <td>4</td>\n",
" <td>1180</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>100</th>\n",
" <td>4</td>\n",
" <td>1165</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>101</th>\n",
" <td>4</td>\n",
" <td>1238</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>5</td>\n",
" <td>1380</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>5</td>\n",
" <td>1350</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>5</td>\n",
" <td>1310</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>5</td>\n",
" <td>1462</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>5</td>\n",
" <td>1069</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>5</td>\n",
" <td>1221</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>5</td>\n",
" <td>1785</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>5</td>\n",
" <td>1628</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>5</td>\n",
" <td>1758</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>5</td>\n",
" <td>1215</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>5</td>\n",
" <td>1134</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>5</td>\n",
" <td>1499</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>5</td>\n",
" <td>1152</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>5</td>\n",
" <td>1086</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>5</td>\n",
" <td>1207</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>5</td>\n",
" <td>1047</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>5</td>\n",
" <td>1278</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses oer \\\n",
"79 4 1448 100.0 0.0 \n",
"80 4 1331 100.0 0.0 \n",
"81 4 1426 100.0 0.0 \n",
"82 4 1632 100.0 0.0 \n",
"84 4 1564 100.0 0.0 \n",
"86 4 1291 100.0 0.0 \n",
"89 4 1680 100.0 0.0 \n",
"91 4 1040 100.0 0.0 \n",
"92 4 1142 100.0 0.0 \n",
"93 4 1168 100.0 0.0 \n",
"94 4 1150 100.0 0.0 \n",
"95 4 1270 100.0 0.0 \n",
"97 4 1180 100.0 0.0 \n",
"100 4 1165 100.0 0.0 \n",
"101 4 1238 100.0 0.0 \n",
"107 5 1380 100.0 0.0 \n",
"108 5 1350 100.0 0.0 \n",
"109 5 1310 100.0 0.0 \n",
"110 5 1462 100.0 0.0 \n",
"111 5 1069 100.0 0.0 \n",
"112 5 1221 100.0 0.0 \n",
"116 5 1785 100.0 0.0 \n",
"117 5 1628 100.0 0.0 \n",
"118 5 1758 100.0 0.0 \n",
"119 5 1215 100.0 0.0 \n",
"120 5 1134 100.0 0.0 \n",
"122 5 1499 100.0 0.0 \n",
"125 5 1152 100.0 0.0 \n",
"126 5 1086 100.0 0.0 \n",
"127 5 1207 100.0 0.0 \n",
"128 5 1047 100.0 0.0 \n",
"130 5 1278 100.0 0.0 \n",
"\n",
" clusters \n",
"79 0 \n",
"80 0 \n",
"81 0 \n",
"82 0 \n",
"84 0 \n",
"86 0 \n",
"89 0 \n",
"91 0 \n",
"92 0 \n",
"93 0 \n",
"94 0 \n",
"95 0 \n",
"97 0 \n",
"100 0 \n",
"101 0 \n",
"107 0 \n",
"108 0 \n",
"109 0 \n",
"110 0 \n",
"111 0 \n",
"112 0 \n",
"116 0 \n",
"117 0 \n",
"118 0 \n",
"119 0 \n",
"120 0 \n",
"122 0 \n",
"125 0 \n",
"126 0 \n",
"127 0 \n",
"128 0 \n",
"130 0 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# rows carrying cluster label 0\n",
"in_cluster_0 = new_df[\"clusters\"].eq(0)\n",
"cluster_0 = new_df.loc[in_cluster_0]\n",
"display(cluster_0)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "849d9447",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 1040\n",
"mean_reaction_time max - 1785\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n"
]
}
],
"source": [
"cluster_0 = new_df.loc[new_df[\"clusters\"].eq(0)]\n",
"\n",
"# (column, label printed before the minimum, label printed before the maximum)\n",
"range_report = [\n",
"    (\n",
"        'mean_reaction_time',\n",
"        \"mean_reaction_time min - \",\n",
"        \"mean_reaction_time max - \",\n",
"    ),\n",
"    (\n",
"        'percentage_no_of_correct_responses',\n",
"        \"percentage_no_of_correct_responses min - \",\n",
"        \"percentage_no_of_correct_responses max - \",\n",
"    ),\n",
"    (\n",
"        'oer',\n",
"        \"oer min - \",\n",
"        \"oer max - \",\n",
"    ),\n",
"]\n",
"\n",
"for position, (column, min_label, max_label) in enumerate(range_report):\n",
"    if position > 0:\n",
"        print()  # blank line between metrics, none after the last one\n",
"    maxVal = cluster_0[column].max()\n",
"    minVal = cluster_0[column].min()\n",
"    print(min_label, minVal)\n",
"    print(max_label, maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2 (MeanShift label 1)"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "f9ed816e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"9"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# number of rows assigned to cluster label 1\n",
"new_df.loc[new_df[\"clusters\"] == 1].shape[0]"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "e3eeb500",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>83</th>\n",
" <td>4</td>\n",
" <td>1340</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>90</th>\n",
" <td>4</td>\n",
" <td>1317</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>96</th>\n",
" <td>4</td>\n",
" <td>1457</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>98</th>\n",
" <td>4</td>\n",
" <td>1261</td>\n",
" <td>90.000000</td>\n",
" <td>10.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>5</td>\n",
" <td>1600</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>5</td>\n",
" <td>1396</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>5</td>\n",
" <td>1598</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>5</td>\n",
" <td>1364</td>\n",
" <td>91.666667</td>\n",
" <td>8.333333</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>5</td>\n",
" <td>1998</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age mean_reaction_time percentage_no_of_correct_responses \\\n",
"83 4 1340 90.000000 \n",
"90 4 1317 90.000000 \n",
"96 4 1457 90.000000 \n",
"98 4 1261 90.000000 \n",
"105 5 1600 91.666667 \n",
"106 5 1396 91.666667 \n",
"115 5 1598 91.666667 \n",
"121 5 1364 91.666667 \n",
"123 5 1998 100.000000 \n",
"\n",
" oer clusters \n",
"83 10.000000 1 \n",
"90 10.000000 1 \n",
"96 10.000000 1 \n",
"98 10.000000 1 \n",
"105 8.333333 1 \n",
"106 8.333333 1 \n",
"115 8.333333 1 \n",
"121 8.333333 1 \n",
"123 0.000000 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# rows carrying cluster label 1\n",
"in_cluster_1 = new_df[\"clusters\"].eq(1)\n",
"cluster_1 = new_df.loc[in_cluster_1]\n",
"display(cluster_1)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "bb910e6a",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"mean_reaction_time min - 1261\n",
"mean_reaction_time max - 1998\n",
"\n",
"percentage_no_of_correct_responses min - 90.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 10.0\n"
]
}
],
"source": [
"cluster_1 = new_df.loc[new_df[\"clusters\"].eq(1)]\n",
"\n",
"# (column, label printed before the minimum, label printed before the maximum)\n",
"range_report = [\n",
"    (\n",
"        'mean_reaction_time',\n",
"        \"mean_reaction_time min - \",\n",
"        \"mean_reaction_time max - \",\n",
"    ),\n",
"    (\n",
"        'percentage_no_of_correct_responses',\n",
"        \"percentage_no_of_correct_responses min - \",\n",
"        \"percentage_no_of_correct_responses max - \",\n",
"    ),\n",
"    (\n",
"        'oer',\n",
"        \"oer min - \",\n",
"        \"oer max - \",\n",
"    ),\n",
"]\n",
"\n",
"for position, (column, min_label, max_label) in enumerate(range_report):\n",
"    if position > 0:\n",
"        print()  # blank line between metrics, none after the last one\n",
"    maxVal = cluster_1[column].max()\n",
"    minVal = cluster_1[column].min()\n",
"    print(min_label, minVal)\n",
"    print(max_label, maxVal)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "e7f55f44",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "bcdc5589",
"metadata": {},
"outputs": [],
"source": [
"# importing libraries \n",
"import numpy as nm \n",
"import matplotlib.pyplot as mtp \n",
"import pandas as pd \n",
"from sklearn.cluster import DBSCAN\n",
"from numpy import unique\n",
"from numpy import where\n",
"from matplotlib import pyplot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "f448f999",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>child_gender</th>\n",
" <th>child_age</th>\n",
" <th>total_correct_responses</th>\n",
" <th>correct_responses</th>\n",
" <th>commission_errors</th>\n",
" <th>omission_errors</th>\n",
" <th>mean_reaction_time</th>\n",
" <th>total_duration</th>\n",
" <th>diagnosis</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>game</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>160</th>\n",
" <td>161</td>\n",
" <td>1</td>\n",
" <td>4</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>3459</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>162</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>3000</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>162</th>\n",
" <td>163</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>10888</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>164</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>7081</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>164</th>\n",
" <td>165</td>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" <td>7</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>9953</td>\n",
" <td>No</td>\n",
" <td>85.714286</td>\n",
" <td>14.285714</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>319</th>\n",
" <td>320</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>12332</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>320</th>\n",
" <td>321</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>8190</td>\n",
" <td>No</td>\n",
" <td>0.000000</td>\n",
" <td>100.000000</td>\n",
" <td>50.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>321</th>\n",
" <td>322</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>7</td>\n",
" <td>5</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>6749</td>\n",
" <td>No</td>\n",
" <td>71.428571</td>\n",
" <td>28.571429</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>322</th>\n",
" <td>323</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>7</td>\n",
" <td>7</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>7795</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" <tr>\n",
" <th>323</th>\n",
" <td>324</td>\n",
" <td>1</td>\n",
" <td>7</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>14779</td>\n",
" <td>No</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>Selective</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>164 rows × 14 columns</p>\n",
"</div>"
],
"text/plain": [
" id child_gender child_age total_correct_responses correct_responses \\\n",
"160 161 1 4 8 8 \n",
"161 162 2 4 6 6 \n",
"162 163 2 4 6 6 \n",
"163 164 2 4 6 6 \n",
"164 165 2 4 7 6 \n",
".. ... ... ... ... ... \n",
"319 320 1 7 8 8 \n",
"320 321 1 7 6 0 \n",
"321 322 1 7 7 5 \n",
"322 323 1 7 7 7 \n",
"323 324 1 7 6 6 \n",
"\n",
" commission_errors omission_errors mean_reaction_time total_duration \\\n",
"160 0 0 0 3459 \n",
"161 0 0 0 3000 \n",
"162 0 0 0 10888 \n",
"163 0 0 0 7081 \n",
"164 0 1 0 9953 \n",
".. ... ... ... ... \n",
"319 0 0 0 12332 \n",
"320 3 6 0 8190 \n",
"321 0 2 0 6749 \n",
"322 0 0 0 7795 \n",
"323 0 0 0 14779 \n",
"\n",
" diagnosis percentage_no_of_correct_responses oer cer game \n",
"160 No 100.000000 0.000000 0.0 Selective \n",
"161 No 100.000000 0.000000 0.0 Selective \n",
"162 No 100.000000 0.000000 0.0 Selective \n",
"163 No 100.000000 0.000000 0.0 Selective \n",
"164 No 85.714286 14.285714 0.0 Selective \n",
".. ... ... ... ... ... \n",
"319 No 100.000000 0.000000 0.0 Selective \n",
"320 No 0.000000 100.000000 50.0 Selective \n",
"321 No 71.428571 28.571429 0.0 Selective \n",
"322 No 100.000000 0.000000 0.0 Selective \n",
"323 No 100.000000 0.000000 0.0 Selective \n",
"\n",
"[164 rows x 14 columns]"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Importing the dataset \n",
"dataset = pd.read_csv('data.csv') \n",
"dataset.drop(dataset.index[dataset['game'] == 'Alternating'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Sustained'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Focused'], inplace = True)\n",
"dataset.drop(dataset.index[dataset['game'] == 'Divided'], inplace = True)\n",
"display(dataset)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "12841129",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[3.45900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [3.00000000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.08880000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.08100000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.95300000e+03, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [1.42070000e+04, 1.00000000e+02, 0.00000000e+00, 2.22222222e+01],\n",
" [1.40360000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.26460000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.25100000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.00260000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.14820000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.20860000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.08160000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [6.34500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.12010000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.02360000e+04, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [1.08300000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.03480000e+04, 1.25000000e+01, 8.75000000e+01, 0.00000000e+00],\n",
" [1.62220000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.05950000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.39870000e+04, 7.50000000e+01, 2.50000000e+01, 0.00000000e+00],\n",
" [1.54400000e+04, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [2.22960000e+04, 1.00000000e+02, 0.00000000e+00, 3.33333333e+01],\n",
" [1.17240000e+04, 3.33333333e+01, 6.66666667e+01, 0.00000000e+00],\n",
" [1.22480000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.11010000e+04, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [1.11910000e+04, 8.33333333e+01, 1.66666667e+01, 0.00000000e+00],\n",
" [1.36940000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [3.23100000e+03, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [9.90700000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.12920000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.74950000e+04, 1.00000000e+02, 0.00000000e+00, 7.14285714e+01],\n",
" [1.16270000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.32740000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [6.27600000e+03, 1.66666667e+01, 8.33333333e+01, 0.00000000e+00],\n",
" [7.85300000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.57400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.80100000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.41300000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.30000000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.56450000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.49870000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.82480000e+04, 1.00000000e+02, 0.00000000e+00, 1.25000000e+01],\n",
" [1.31300000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.93400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [3.03870000e+04, 1.00000000e+02, 0.00000000e+00, 1.66666667e+01],\n",
" [1.74640000e+04, 1.00000000e+02, 0.00000000e+00, 1.66666667e+01],\n",
" [2.39880000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.28070000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.55610000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.23750000e+04, 1.00000000e+02, 0.00000000e+00, 6.66666667e+01],\n",
" [1.13250000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.48200000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.68690000e+04, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [1.41300000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.23670000e+04, 7.14285714e+01, 2.85714286e+01, 0.00000000e+00],\n",
" [2.06640000e+04, 1.00000000e+02, 0.00000000e+00, 1.66666667e+01],\n",
" [2.31060000e+04, 1.00000000e+02, 0.00000000e+00, 1.66666667e+01],\n",
" [1.19780000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.03580000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.19410000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.34150000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.07400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.00500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.58790000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.26770000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.74400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.08490000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.05770000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.06280000e+04, 1.00000000e+02, 0.00000000e+00, 1.25000000e+01],\n",
" [1.07640000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.25530000e+04, 6.66666667e+01, 3.33333333e+01, 0.00000000e+00],\n",
" [1.24130000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.87900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.20000000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.37500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [5.43700000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.47700000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.93500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.39790000e+04, 1.00000000e+02, 0.00000000e+00, 1.42857143e+01],\n",
" [1.65020000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.24260000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.22190000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.01400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.37300000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.83800000e+03, 8.33333333e+01, 1.66666667e+01, 1.66666667e+01],\n",
" [9.29900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.59050000e+04, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [1.13420000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.01240000e+04, 1.00000000e+02, 0.00000000e+00, 1.66666667e+01],\n",
" [9.88900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.31560000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.37860000e+04, 8.33333333e+01, 1.66666667e+01, 0.00000000e+00],\n",
" [1.43970000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.00580000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.08740000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.08740000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [5.11200000e+03, 3.33333333e+01, 6.66666667e+01, 0.00000000e+00],\n",
" [1.24100000e+04, 1.00000000e+02, 0.00000000e+00, 1.42857143e+01],\n",
" [1.33050000e+04, 8.33333333e+01, 1.66666667e+01, 0.00000000e+00],\n",
" [1.10750000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.05900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.00000000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.28890000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.57190000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [5.04610000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.98860000e+04, 1.00000000e+02, 0.00000000e+00, 1.42857143e+01],\n",
" [4.21990000e+04, 1.00000000e+02, 0.00000000e+00, 8.33333333e+01],\n",
" [1.03810000e+04, 5.00000000e+01, 5.00000000e+01, 0.00000000e+00],\n",
" [6.20200000e+03, 6.66666667e+01, 3.33333333e+01, 3.33333333e+01],\n",
" [4.78000000e+03, 1.00000000e+02, 0.00000000e+00, 1.42857143e+01],\n",
" [1.90550000e+04, 5.00000000e+01, 5.00000000e+01, 0.00000000e+00],\n",
" [7.02600000e+03, 6.66666667e+01, 3.33333333e+01, 0.00000000e+00],\n",
" [1.17090000e+04, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [1.06880000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.46340000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.38610000e+04, 1.00000000e+02, 0.00000000e+00, 1.25000000e+01],\n",
" [1.21830000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.54290000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.03700000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.42630000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.36920000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.11330000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.16450000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.79200000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.13800000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.01770000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.17300000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.30270000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.28600000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.97000000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.24430000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.43890000e+04, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [8.37000000e+03, 1.66666667e+01, 8.33333333e+01, 1.66666667e+01],\n",
" [1.40110000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [2.36890000e+04, 8.33333333e+01, 1.66666667e+01, 3.33333333e+01],\n",
" [1.61690000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.12600000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.44260000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.01810000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [4.78290000e+04, 1.00000000e+02, 0.00000000e+00, 5.71428571e+01],\n",
" [1.45930000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.15200000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.93500000e+03, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [1.15260000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.09000000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.32500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.13240000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.48250000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.65900000e+04, 8.75000000e+01, 1.25000000e+01, 0.00000000e+00],\n",
" [1.82770000e+04, 8.57142857e+01, 1.42857143e+01, 0.00000000e+00],\n",
" [6.94200000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.15400000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.86600000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [9.01900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [5.56800000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [7.34900000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.44060000e+04, 1.66666667e+01, 8.33333333e+01, 0.00000000e+00],\n",
" [9.16600000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.23320000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [8.19000000e+03, 0.00000000e+00, 1.00000000e+02, 5.00000000e+01],\n",
" [6.74900000e+03, 7.14285714e+01, 2.85714286e+01, 0.00000000e+00],\n",
" [7.79500000e+03, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00],\n",
" [1.47790000e+04, 1.00000000e+02, 0.00000000e+00, 0.00000000e+00]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# extracting only 11-comission & 12-omission\n",
"x = dataset.iloc[:, [8, 10, 11, 12]].values \n",
"display(x)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "d569e05b",
"metadata": {
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"array([[-1.42198814e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.49278251e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.76168192e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.63345004e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.20378940e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [ 2.35741406e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 1.42682072e+00],\n",
" [ 2.09367034e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.02113725e-03, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.37124867e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.09119705e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.84551951e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-9.13933502e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.87273190e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-9.76862769e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.27892294e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.76730125e-01, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [-2.85113885e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.59455683e-01, -4.44593737e+00, 4.44593737e+00,\n",
" -3.16765400e-01],\n",
" [ 5.46527137e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.21359367e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.01809466e-01, -1.00739969e+00, 1.00739969e+00,\n",
" -3.16765400e-01],\n",
" [ 4.25914511e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [ 1.48335718e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 2.29861377e+00],\n",
" [-1.47226816e-01, -3.29975814e+00, 3.29975814e+00,\n",
" -3.16765400e-01],\n",
" [-6.64071029e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.43315903e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [-2.29434655e-01, -5.48927996e-01, 5.48927996e-01,\n",
" -3.16765400e-01],\n",
" [ 1.56618290e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.45715397e+00, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [-4.27473800e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.13856809e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 7.42869685e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 5.28761855e+00],\n",
" [-1.62187718e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.63420008e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-9.87505060e-01, -4.21670152e+00, 4.21670152e+00,\n",
" -3.16765400e-01],\n",
" [-7.44274739e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-6.33070514e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.52295015e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-6.57902526e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-6.75331204e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 4.57532910e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.56045560e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 8.59009465e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 6.64001790e-01],\n",
" [ 6.96291325e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.23309426e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.73128142e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 9.90924187e-01],\n",
" [ 7.38088366e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 9.90924187e-01],\n",
" [ 1.74432465e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.98108740e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.98693802e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.49554183e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 4.91399295e+00],\n",
" [-2.08767018e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.30288132e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 6.46317890e-01, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [ 2.23865227e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.80530076e-02, -1.20388755e+00, 1.20388755e+00,\n",
" -3.16765400e-01],\n",
" [ 1.23164387e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 9.90924187e-01],\n",
" [ 1.60828841e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 9.90924187e-01],\n",
" [-1.08050848e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.57913322e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.13757584e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.13586419e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.55952467e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.20830852e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 4.93624157e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.39818318e-04, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.61086473e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.82183399e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.24135617e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.16269576e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 6.64001790e-01],\n",
" [-2.95293467e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.93650940e-02, -1.46587138e+00, 1.46587138e+00,\n",
" -3.16765400e-01],\n",
" [-4.09581473e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.40264600e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.36518719e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.17999592e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.11690914e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.22576328e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.77391284e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.00575577e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 8.04111389e-01],\n",
" [ 5.89713243e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.89530781e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.08799496e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.19442727e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.09835875e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.38116091e-01, -5.48927996e-01, 5.48927996e-01,\n",
" 9.90924187e-01],\n",
" [-5.21249346e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 4.97634295e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [-2.06145005e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.94004568e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 9.90924187e-01],\n",
" [-4.30250050e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 7.36392710e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.70808011e-01, -5.48927996e-01, 5.48927996e-01,\n",
" -3.16765400e-01],\n",
" [ 2.65046264e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.04184150e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.78327497e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.78327497e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.16703587e+00, -3.29975814e+00, 3.29975814e+00,\n",
" -3.16765400e-01],\n",
" [-4.14208556e-02, 3.68015386e-01, -3.68015386e-01,\n",
" 8.04111389e-01],\n",
" [ 9.66204491e-02, -5.48927996e-01, 5.48927996e-01,\n",
" -3.16765400e-01],\n",
" [-2.47326042e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.58266008e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.13129843e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.24582337e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.01130733e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 5.82741678e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.11164819e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 8.04111389e-01],\n",
" [ 4.55311817e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 6.22168254e+00],\n",
" [-3.54365891e-01, -2.38281476e+00, 2.38281476e+00,\n",
" -3.16765400e-01],\n",
" [-9.98918531e-01, -1.46587138e+00, 1.46587138e+00,\n",
" 2.29861377e+00],\n",
" [-1.21824226e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 8.04111389e-01],\n",
" [ 9.83477993e-01, -2.38281476e+00, 2.38281476e+00,\n",
" -3.16765400e-01],\n",
" [-8.71827989e-01, -1.46587138e+00, 1.46587138e+00,\n",
" -3.16765400e-01],\n",
" [-1.49540358e-01, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [-3.07015410e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.01600219e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.82375718e-01, 3.68015386e-01, -3.68015386e-01,\n",
" 6.64001790e-01],\n",
" [-7.64324490e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 4.24217914e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.61659203e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.44378628e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.56309818e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.38380348e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.59411468e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-4.45210951e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.46081357e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.15653089e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.46301400e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 5.37428148e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.23254415e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.71993021e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.63310644e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.63812376e-01, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [-6.64534678e-01, -4.21670152e+00, 4.21670152e+00,\n",
" 9.90924187e-01],\n",
" [ 2.05511132e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 1.69820806e+00, -5.48927996e-01, 5.48927996e-01,\n",
" 2.29861377e+00],\n",
" [ 5.38352624e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.47932190e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.69519111e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-3.85213110e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 5.42146738e+00, 3.68015386e-01, -3.68015386e-01,\n",
" 4.16674176e+00],\n",
" [ 2.95276539e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.52394241e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-7.31627379e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [-1.77765563e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.53484690e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-6.71475302e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-2.08921254e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.31059313e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 6.03286020e-01, -3.19692150e-01, 3.19692150e-01,\n",
" -3.16765400e-01],\n",
" [ 8.63482311e-01, -4.17936084e-01, 4.17936084e-01,\n",
" -3.16765400e-01],\n",
" [-8.84783821e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.52085769e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.88033575e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.64435452e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-1.09670421e+00, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-8.22009730e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 2.66434389e-01, -4.21670152e+00, 4.21670152e+00,\n",
" -3.16765400e-01],\n",
" [-5.41762746e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-5.34512709e-02, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [-6.92297175e-01, -5.13364491e+00, 5.13364491e+00,\n",
" 3.60630336e+00],\n",
" [-9.14551387e-01, -1.20388755e+00, 1.20388755e+00,\n",
" -3.16765400e-01],\n",
" [-7.53220432e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01],\n",
" [ 3.23964452e-01, 3.68015386e-01, -3.68015386e-01,\n",
" -3.16765400e-01]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# standardizing the data\n",
"from sklearn.preprocessing import StandardScaler\n",
"scaler = StandardScaler()\n",
"new_df = scaler.fit_transform(x)\n",
"\n",
"# statistics of scaled data\n",
"pd.DataFrame(new_df).describe()\n",
"\n",
"display(new_df)\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "82afaeca",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([[ 4.00000000e+00, -1.42198814e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -1.49278251e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.76168192e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -8.63345004e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -4.20378940e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 2.35741406e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 1.42682072e+00],\n",
" [ 4.00000000e+00, 2.09367034e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -5.02113725e-03, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -8.37124867e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -4.09119705e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -1.84551951e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -9.13933502e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.87273190e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -9.76862769e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.27892294e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -3.76730125e-01, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.85113885e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -3.59455683e-01, -4.44593737e+00,\n",
" 4.44593737e+00, -3.16765400e-01],\n",
" [ 4.00000000e+00, 5.46527137e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -3.21359367e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 2.01809466e-01, -1.00739969e+00,\n",
" 1.00739969e+00, -3.16765400e-01],\n",
" [ 4.00000000e+00, 4.25914511e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.48335718e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 2.29861377e+00],\n",
" [ 4.00000000e+00, -1.47226816e-01, -3.29975814e+00,\n",
" 3.29975814e+00, -3.16765400e-01],\n",
" [ 4.00000000e+00, -6.64071029e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.43315903e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.29434655e-01, -5.48927996e-01,\n",
" 5.48927996e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.56618290e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -1.45715397e+00, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -4.27473800e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -2.13856809e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 7.42869685e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 5.28761855e+00],\n",
" [ 4.00000000e+00, -1.62187718e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.63420008e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -9.87505060e-01, -4.21670152e+00,\n",
" 4.21670152e+00, -3.16765400e-01],\n",
" [ 4.00000000e+00, -7.44274739e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -6.33070514e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -7.52295015e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -6.57902526e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -6.75331204e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 4.57532910e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 3.56045560e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 8.59009465e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 6.64001790e-01],\n",
" [ 4.00000000e+00, 6.96291325e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, -4.23309426e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 2.73128142e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 9.90924187e-01],\n",
" [ 4.00000000e+00, 7.38088366e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 9.90924187e-01],\n",
" [ 4.00000000e+00, 1.74432465e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.98108740e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.98693802e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 1.49554183e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 4.91399295e+00],\n",
" [ 4.00000000e+00, -2.08767018e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 3.30288132e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 6.46317890e-01, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 4.00000000e+00, 2.23865227e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.80530076e-02, -1.20388755e+00,\n",
" 1.20388755e+00, -3.16765400e-01],\n",
" [ 5.00000000e+00, 1.23164387e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 9.90924187e-01],\n",
" [ 5.00000000e+00, 1.60828841e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 9.90924187e-01],\n",
" [ 5.00000000e+00, -1.08050848e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -3.57913322e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -1.13757584e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 1.13586419e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -5.55952467e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -7.20830852e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 4.93624157e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.39818318e-04, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -7.61086473e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.82183399e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -3.24135617e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -3.16269576e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 6.64001790e-01],\n",
" [ 5.00000000e+00, -2.95293467e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -1.93650940e-02, -1.46587138e+00,\n",
" 1.46587138e+00, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.09581473e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -7.40264600e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -5.36518719e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -8.17999592e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -1.11690914e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 3.22576328e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -5.77391284e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 2.00575577e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 8.04111389e-01],\n",
" [ 5.00000000e+00, 5.89713243e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -3.89530781e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -7.08799496e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -7.19442727e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -5.09835875e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.38116091e-01, -5.48927996e-01,\n",
" 5.48927996e-01, 9.90924187e-01],\n",
" [ 5.00000000e+00, -5.21249346e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 4.97634295e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.06145005e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -3.94004568e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 9.90924187e-01],\n",
" [ 5.00000000e+00, -4.30250050e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 7.36392710e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 1.70808011e-01, -5.48927996e-01,\n",
" 5.48927996e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 2.65046264e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.04184150e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.78327497e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.78327497e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -1.16703587e+00, -3.29975814e+00,\n",
" 3.29975814e+00, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.14208556e-02, 3.68015386e-01,\n",
" -3.68015386e-01, 8.04111389e-01],\n",
" [ 5.00000000e+00, 9.66204491e-02, -5.48927996e-01,\n",
" 5.48927996e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -2.47326042e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -5.58266008e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, -4.13129843e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 3.24582337e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 2.01130733e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 5.82741678e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 5.00000000e+00, 1.11164819e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 8.04111389e-01],\n",
" [ 5.00000000e+00, 4.55311817e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 6.22168254e+00],\n",
" [ 5.00000000e+00, -3.54365891e-01, -2.38281476e+00,\n",
" 2.38281476e+00, -3.16765400e-01],\n",
" [ 6.00000000e+00, -9.98918531e-01, -1.46587138e+00,\n",
" 1.46587138e+00, 2.29861377e+00],\n",
" [ 6.00000000e+00, -1.21824226e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 8.04111389e-01],\n",
" [ 6.00000000e+00, 9.83477993e-01, -2.38281476e+00,\n",
" 2.38281476e+00, -3.16765400e-01],\n",
" [ 6.00000000e+00, -8.71827989e-01, -1.46587138e+00,\n",
" 1.46587138e+00, -3.16765400e-01],\n",
" [ 6.00000000e+00, -1.49540358e-01, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -3.07015410e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 3.01600219e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 1.82375718e-01, 3.68015386e-01,\n",
" -3.68015386e-01, 6.64001790e-01],\n",
" [ 6.00000000e+00, -7.64324490e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 4.24217914e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -5.61659203e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 2.44378628e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 1.56309818e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -2.38380348e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -1.59411468e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -4.45210951e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -5.46081357e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 1.15653089e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -1.46301400e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 5.37428148e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -5.23254415e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -5.71993021e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -3.63310644e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, 2.63812376e-01, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 6.00000000e+00, -6.64534678e-01, -4.21670152e+00,\n",
" 4.21670152e+00, 9.90924187e-01],\n",
" [ 6.00000000e+00, 2.05511132e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 1.69820806e+00, -5.48927996e-01,\n",
" 5.48927996e-01, 2.29861377e+00],\n",
" [ 7.00000000e+00, 5.38352624e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.47932190e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 2.69519111e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -3.85213110e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 5.42146738e+00, 3.68015386e-01,\n",
" -3.68015386e-01, 4.16674176e+00],\n",
" [ 7.00000000e+00, 2.95276539e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -8.52394241e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -7.31627379e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -1.77765563e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.53484690e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -6.71475302e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -2.08921254e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 3.31059313e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 6.03286020e-01, -3.19692150e-01,\n",
" 3.19692150e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 8.63482311e-01, -4.17936084e-01,\n",
" 4.17936084e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -8.84783821e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -8.52085769e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.88033575e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.64435452e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -1.09670421e+00, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -8.22009730e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 2.66434389e-01, -4.21670152e+00,\n",
" 4.21670152e+00, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.41762746e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -5.34512709e-02, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, -6.92297175e-01, -5.13364491e+00,\n",
" 5.13364491e+00, 3.60630336e+00],\n",
" [ 7.00000000e+00, -9.14551387e-01, -1.20388755e+00,\n",
" 1.20388755e+00, -3.16765400e-01],\n",
" [ 7.00000000e+00, -7.53220432e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01],\n",
" [ 7.00000000e+00, 3.23964452e-01, 3.68015386e-01,\n",
" -3.68015386e-01, -3.16765400e-01]])"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"x = dataset.iloc[:, [2, 8, 10, 11, 12]].copy()\n",
"x[['total_duration', 'percentage_no_of_correct_responses', 'oer', 'cer']] = new_df\n",
"x.head()\n",
"x = x.to_numpy()\n",
"display(x)\n"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "5d1c61bf",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.datasets import make_classification\n",
"from sklearn.cluster import MeanShift\n",
"\n",
"# define the model\n",
"model = MeanShift()\n",
"# fit model and predict clusters\n",
"yhat = model.fit_predict(x)\n",
"# retrieve unique clusters\n",
"clusters = unique(yhat)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "ac062128",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[[ 4.79279279 -0.17014686 0.27567199 -0.27567199 -0.19713228]\n",
" [ 4.4 -0.60311786 -3.52899399 3.52899399 -0.3167654 ]\n",
" [ 4. 1.11920576 0.36801539 -0.36801539 5.10080575]\n",
" [ 7. 5.42146738 0.36801539 -0.36801539 4.16674176]\n",
" [ 7. 1.69820806 -0.548928 0.548928 2.29861377]\n",
" [ 7. 0.26643439 -4.21670152 4.21670152 -0.3167654 ]\n",
" [ 7. -0.69229717 -5.13364491 5.13364491 3.60630336]\n",
" [ 6. -0.66453468 -4.21670152 4.21670152 0.99092419]\n",
" [ 6. -0.99891853 -1.46587138 1.46587138 2.29861377]\n",
" [ 5. 5.82741678 0.36801539 -0.36801539 -0.3167654 ]\n",
" [ 5. 4.55311817 0.36801539 -0.36801539 6.22168254]]\n",
"Estimated clusters: 11\n"
]
}
],
"source": [
"ms = MeanShift()\n",
"ms.fit(x)\n",
"labels = ms.labels_\n",
"cluster_centers = ms.cluster_centers_\n",
"print(cluster_centers)\n",
"n_clusters_ = len(nm.unique(labels))\n",
"print(\"Estimated clusters:\", n_clusters_)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "2e691585",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>160</th>\n",
" <td>4</td>\n",
" <td>3459</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>4</td>\n",
" <td>3000</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>162</th>\n",
" <td>4</td>\n",
" <td>10888</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>4</td>\n",
" <td>7081</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>164</th>\n",
" <td>4</td>\n",
" <td>9953</td>\n",
" <td>85.714286</td>\n",
" <td>14.285714</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>319</th>\n",
" <td>7</td>\n",
" <td>12332</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>320</th>\n",
" <td>7</td>\n",
" <td>8190</td>\n",
" <td>0.000000</td>\n",
" <td>100.000000</td>\n",
" <td>50.0</td>\n",
" <td>6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>321</th>\n",
" <td>7</td>\n",
" <td>6749</td>\n",
" <td>71.428571</td>\n",
" <td>28.571429</td>\n",
" <td>0.0</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>322</th>\n",
" <td>7</td>\n",
" <td>7795</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>323</th>\n",
" <td>7</td>\n",
" <td>14779</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>164 rows × 6 columns</p>\n",
"</div>"
],
"text/plain": [
" child_age total_duration percentage_no_of_correct_responses \\\n",
"160 4 3459 100.000000 \n",
"161 4 3000 100.000000 \n",
"162 4 10888 100.000000 \n",
"163 4 7081 100.000000 \n",
"164 4 9953 85.714286 \n",
".. ... ... ... \n",
"319 7 12332 100.000000 \n",
"320 7 8190 0.000000 \n",
"321 7 6749 71.428571 \n",
"322 7 7795 100.000000 \n",
"323 7 14779 100.000000 \n",
"\n",
" oer cer clusters \n",
"160 0.000000 0.0 0 \n",
"161 0.000000 0.0 0 \n",
"162 0.000000 0.0 0 \n",
"163 0.000000 0.0 0 \n",
"164 14.285714 0.0 0 \n",
".. ... ... ... \n",
"319 0.000000 0.0 0 \n",
"320 100.000000 50.0 6 \n",
"321 28.571429 0.0 8 \n",
"322 0.000000 0.0 0 \n",
"323 0.000000 0.0 0 \n",
"\n",
"[164 rows x 6 columns]"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"new_df = dataset.iloc[:, [2, 8, 10, 11, 12]].copy()\n",
"new_df['clusters'] = yhat\n",
"new_df.head()\n",
"display(new_df)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "017f8397",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Silhouette Coefficient: 0.416\n",
"Calinski-Harabasz Index: 27.590\n",
"Davies-Bouldin Index: 0.519\n"
]
}
],
"source": [
"from sklearn.metrics import silhouette_score,calinski_harabasz_score,davies_bouldin_score\n",
"\n",
"print(\"Silhouette Coefficient: %0.3f\" % silhouette_score(x, yhat))\n",
"print(\"Calinski-Harabasz Index: %0.3f\" % calinski_harabasz_score(x, yhat))\n",
"print(\"Davies-Bouldin Index: %0.3f\" % davies_bouldin_score(x, yhat))"
]
},
{
"cell_type": "markdown",
"id": "900a0d3f",
"metadata": {},
"source": [
"# Cluster Analysis"
]
},
{
"cell_type": "markdown",
"id": "262e8a4f",
"metadata": {},
"source": [
"## Cluster 1"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "ba8fef3b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"145"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 0])"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "6c5b7397",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>160</th>\n",
" <td>4</td>\n",
" <td>3459</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>4</td>\n",
" <td>3000</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>162</th>\n",
" <td>4</td>\n",
" <td>10888</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>4</td>\n",
" <td>7081</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>164</th>\n",
" <td>4</td>\n",
" <td>9953</td>\n",
" <td>85.714286</td>\n",
" <td>14.285714</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>316</th>\n",
" <td>7</td>\n",
" <td>7349</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>318</th>\n",
" <td>7</td>\n",
" <td>9166</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>319</th>\n",
" <td>7</td>\n",
" <td>12332</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>322</th>\n",
" <td>7</td>\n",
" <td>7795</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>323</th>\n",
" <td>7</td>\n",
" <td>14779</td>\n",
" <td>100.000000</td>\n",
" <td>0.000000</td>\n",
" <td>0.0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>145 rows × 6 columns</p>\n",
"</div>"
],
"text/plain": [
" child_age total_duration percentage_no_of_correct_responses oer \\\n",
"160 4 3459 100.000000 0.000000 \n",
"161 4 3000 100.000000 0.000000 \n",
"162 4 10888 100.000000 0.000000 \n",
"163 4 7081 100.000000 0.000000 \n",
"164 4 9953 85.714286 14.285714 \n",
".. ... ... ... ... \n",
"316 7 7349 100.000000 0.000000 \n",
"318 7 9166 100.000000 0.000000 \n",
"319 7 12332 100.000000 0.000000 \n",
"322 7 7795 100.000000 0.000000 \n",
"323 7 14779 100.000000 0.000000 \n",
"\n",
" cer clusters \n",
"160 0.0 0 \n",
"161 0.0 0 \n",
"162 0.0 0 \n",
"163 0.0 0 \n",
"164 0.0 0 \n",
".. ... ... \n",
"316 0.0 0 \n",
"318 0.0 0 \n",
"319 0.0 0 \n",
"322 0.0 0 \n",
"323 0.0 0 \n",
"\n",
"[145 rows x 6 columns]"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"display(cluster_0)\n",
"# cluster_0.boxplot(column =['CER'], grid = False)\n",
"# cluster_0.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "849d9447",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"total_duration min - 3000\n",
"total_duration max - 30387\n",
"\n",
"percentage_no_of_correct_responses min - 66.66666667\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 33.33333333\n",
"\n",
"cer min - 0.0\n",
"cer max - 22.22222222\n"
]
}
],
"source": [
"cluster_0 = new_df[new_df[\"clusters\"] == 0 ]\n",
"\n",
"maxVal = cluster_0['total_duration'].max()\n",
"minVal = cluster_0['total_duration'].min()\n",
"\n",
"print(\"total_duration min - \", minVal)\n",
"print(\"total_duration max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_0['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['oer'].max()\n",
"minVal = cluster_0['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_0['cer'].max()\n",
"minVal = cluster_0['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "dd8d7e4f",
"metadata": {},
"source": [
"## Cluster 2"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "f9ed816e",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"6"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 1])"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "e3eeb500",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>177</th>\n",
" <td>4</td>\n",
" <td>10348</td>\n",
" <td>12.500000</td>\n",
" <td>87.500000</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>183</th>\n",
" <td>4</td>\n",
" <td>11724</td>\n",
" <td>33.333333</td>\n",
" <td>66.666667</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>194</th>\n",
" <td>4</td>\n",
" <td>6276</td>\n",
" <td>16.666667</td>\n",
" <td>83.333333</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>257</th>\n",
" <td>5</td>\n",
" <td>5112</td>\n",
" <td>33.333333</td>\n",
" <td>66.666667</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>268</th>\n",
" <td>5</td>\n",
" <td>10381</td>\n",
" <td>50.000000</td>\n",
" <td>50.000000</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>271</th>\n",
" <td>6</td>\n",
" <td>19055</td>\n",
" <td>50.000000</td>\n",
" <td>50.000000</td>\n",
" <td>0.0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age total_duration percentage_no_of_correct_responses oer \\\n",
"177 4 10348 12.500000 87.500000 \n",
"183 4 11724 33.333333 66.666667 \n",
"194 4 6276 16.666667 83.333333 \n",
"257 5 5112 33.333333 66.666667 \n",
"268 5 10381 50.000000 50.000000 \n",
"271 6 19055 50.000000 50.000000 \n",
"\n",
" cer clusters \n",
"177 0.0 1 \n",
"183 0.0 1 \n",
"194 0.0 1 \n",
"257 0.0 1 \n",
"268 0.0 1 \n",
"271 0.0 1 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"display(cluster_1)\n",
"#cluster_1.boxplot(column =['CER'], grid = False)\n",
"#cluster_1.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "2ab1bc45",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"total_duration min - 5112\n",
"total_duration max - 19055\n",
"\n",
"percentage_no_of_correct_responses min - 12.5\n",
"percentage_no_of_correct_responses max - 50.0\n",
"\n",
"oer min - 50.0\n",
"oer max - 87.5\n",
"\n",
"cer min - 0.0\n",
"cer max - 0.0\n"
]
}
],
"source": [
"cluster_1 = new_df[new_df[\"clusters\"] == 1 ]\n",
"\n",
"maxVal = cluster_1['total_duration'].max()\n",
"minVal = cluster_1['total_duration'].min()\n",
"\n",
"print(\"total_duration min - \", minVal)\n",
"print(\"total_duration max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_1['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['oer'].max()\n",
"minVal = cluster_1['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_1['cer'].max()\n",
"minVal = cluster_1['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "e62b9a30",
"metadata": {},
"source": [
"## Cluster 3"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "105ff3ad",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"3"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 2])"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "9c9ac4a6",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>182</th>\n",
" <td>4</td>\n",
" <td>22296</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>33.333333</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>191</th>\n",
" <td>4</td>\n",
" <td>17495</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>71.428571</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>210</th>\n",
" <td>4</td>\n",
" <td>22375</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>66.666667</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age total_duration percentage_no_of_correct_responses oer \\\n",
"182 4 22296 100.0 0.0 \n",
"191 4 17495 100.0 0.0 \n",
"210 4 22375 100.0 0.0 \n",
"\n",
" cer clusters \n",
"182 33.333333 2 \n",
"191 71.428571 2 \n",
"210 66.666667 2 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_2 = new_df[new_df[\"clusters\"] == 2 ]\n",
"display(cluster_2)\n",
"#cluster_2.boxplot(column =['CER'], grid = False)\n",
"#cluster_2.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "09b1596d",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"total_duration min - 17495\n",
"total_duration max - 22375\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n",
"\n",
"cer min - 33.33333333\n",
"cer max - 71.42857143\n"
]
}
],
"source": [
"cluster_2 = new_df[new_df[\"clusters\"] == 2 ]\n",
"\n",
"maxVal = cluster_2['total_duration'].max()\n",
"minVal = cluster_2['total_duration'].min()\n",
"\n",
"print(\"total_duration min - \", minVal)\n",
"print(\"total_duration max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_2['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_2['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_2['oer'].max()\n",
"minVal = cluster_2['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_2['cer'].max()\n",
"minVal = cluster_2['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "markdown",
"id": "f5704cf3",
"metadata": {},
"source": [
"## Cluster 3"
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "a38aef5c",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"1"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == 3])"
]
},
{
"cell_type": "code",
"execution_count": 20,
"id": "764b57a9",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>300</th>\n",
" <td>7</td>\n",
" <td>47829</td>\n",
" <td>100.0</td>\n",
" <td>0.0</td>\n",
" <td>57.142857</td>\n",
" <td>3</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" child_age total_duration percentage_no_of_correct_responses oer \\\n",
"300 7 47829 100.0 0.0 \n",
"\n",
" cer clusters \n",
"300 57.142857 3 "
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"cluster_3 = new_df[new_df[\"clusters\"] == 3 ]\n",
"display(cluster_3)\n",
"#cluster_2.boxplot(column =['CER'], grid = False)\n",
"#cluster_2.boxplot(column =['OER'], grid = False)"
]
},
{
"cell_type": "code",
"execution_count": 21,
"id": "c8d202ee",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"total_duration min - 47829\n",
"total_duration max - 47829\n",
"\n",
"percentage_no_of_correct_responses min - 100.0\n",
"percentage_no_of_correct_responses max - 100.0\n",
"\n",
"oer min - 0.0\n",
"oer max - 0.0\n",
"\n",
"cer min - 57.14285714\n",
"cer max - 57.14285714\n"
]
}
],
"source": [
"cluster_3 = new_df[new_df[\"clusters\"] == 3 ]\n",
"\n",
"maxVal = cluster_3['total_duration'].max()\n",
"minVal = cluster_3['total_duration'].min()\n",
"\n",
"print(\"total_duration min - \", minVal)\n",
"print(\"total_duration max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_3['percentage_no_of_correct_responses'].max()\n",
"minVal = cluster_3['percentage_no_of_correct_responses'].min()\n",
"\n",
"print(\"percentage_no_of_correct_responses min - \", minVal)\n",
"print(\"percentage_no_of_correct_responses max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_3['oer'].max()\n",
"minVal = cluster_3['oer'].min()\n",
"\n",
"print(\"oer min - \", minVal)\n",
"print(\"oer max - \", maxVal)\n",
"print()\n",
"\n",
"maxVal = cluster_3['cer'].max()\n",
"minVal = cluster_3['cer'].min()\n",
"\n",
"print(\"cer min - \", minVal)\n",
"print(\"cer max - \", maxVal)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "74a86c20",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": 22,
"id": "c3a6eb79",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0"
]
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(new_df[new_df[\"clusters\"] == -1])"
]
},
{
"cell_type": "code",
"execution_count": 23,
"id": "92f1117a",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>child_age</th>\n",
" <th>total_duration</th>\n",
" <th>percentage_no_of_correct_responses</th>\n",
" <th>oer</th>\n",
" <th>cer</th>\n",
" <th>clusters</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [child_age, total_duration, percentage_no_of_correct_responses, oer, cer, clusters]\n",
"Index: []"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"outliers = new_df[new_df[\"clusters\"] == -1 ]\n",
"display(outliers)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "f37f6f4f",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment