Skip to content

Instantly share code, notes, and snippets.

@pree62
Created August 3, 2023 10:03
Show Gist options
  • Save pree62/3618875aad609e513049fec8c3717c23 to your computer and use it in GitHub Desktop.
Save pree62/3618875aad609e513049fec8c3717c23 to your computer and use it in GitHub Desktop.
!excelR/assignments/Gists/crime_data_clustering_assgn.ipynb
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"metadata": {
"id": "O2orI1mwWNkR"
},
"cell_type": "markdown",
"source": "# Hierarchy Clustering"
},
{
"metadata": {
"id": "MBFNU04hMOLK",
"trusted": false
},
"cell_type": "code",
"source": "import pandas as pd \nimport numpy as np\nimport matplotlib.pyplot as plt\n",
"execution_count": null,
"outputs": []
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "C7VpdeUuMpZp",
"outputId": "4b39747a-28e3-47f8-ee1c-fd35cf17742e",
"trusted": false
},
"cell_type": "code",
"source": "df = pd.read_csv(\"crime_data.csv\")\ndf",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-43ede5bf-95a6-45df-bcfd-60af9dd9bc8d\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Unnamed: 0</th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>Alabama</td>\n <td>13.2</td>\n <td>236</td>\n <td>58</td>\n <td>21.2</td>\n </tr>\n <tr>\n <th>1</th>\n <td>Alaska</td>\n <td>10.0</td>\n <td>263</td>\n <td>48</td>\n <td>44.5</td>\n </tr>\n <tr>\n <th>2</th>\n <td>Arizona</td>\n <td>8.1</td>\n <td>294</td>\n <td>80</td>\n <td>31.0</td>\n </tr>\n <tr>\n <th>3</th>\n <td>Arkansas</td>\n <td>8.8</td>\n <td>190</td>\n <td>50</td>\n <td>19.5</td>\n </tr>\n <tr>\n <th>4</th>\n <td>California</td>\n <td>9.0</td>\n <td>276</td>\n <td>91</td>\n <td>40.6</td>\n </tr>\n <tr>\n <th>5</th>\n <td>Colorado</td>\n <td>7.9</td>\n <td>204</td>\n <td>78</td>\n <td>38.7</td>\n </tr>\n <tr>\n <th>6</th>\n <td>Connecticut</td>\n <td>3.3</td>\n <td>110</td>\n <td>77</td>\n <td>11.1</td>\n </tr>\n <tr>\n <th>7</th>\n <td>Delaware</td>\n <td>5.9</td>\n <td>238</td>\n <td>72</td>\n <td>15.8</td>\n </tr>\n <tr>\n <th>8</th>\n <td>Florida</td>\n <td>15.4</td>\n <td>335</td>\n <td>80</td>\n <td>31.9</td>\n </tr>\n <tr>\n <th>9</th>\n <td>Georgia</td>\n <td>17.4</td>\n <td>211</td>\n <td>60</td>\n <td>25.8</td>\n </tr>\n <tr>\n <th>10</th>\n <td>Hawaii</td>\n <td>5.3</td>\n <td>46</td>\n <td>83</td>\n <td>20.2</td>\n </tr>\n <tr>\n <th>11</th>\n <td>Idaho</td>\n <td>2.6</td>\n <td>120</td>\n <td>54</td>\n <td>14.2</td>\n </tr>\n <tr>\n <th>12</th>\n <td>Illinois</td>\n <td>10.4</td>\n <td>249</td>\n <td>83</td>\n <td>24.0</td>\n </tr>\n <tr>\n <th>13</th>\n <td>Indiana</td>\n 
<td>7.2</td>\n <td>113</td>\n <td>65</td>\n <td>21.0</td>\n </tr>\n <tr>\n <th>14</th>\n <td>Iowa</td>\n <td>2.2</td>\n <td>56</td>\n <td>57</td>\n <td>11.3</td>\n </tr>\n <tr>\n <th>15</th>\n <td>Kansas</td>\n <td>6.0</td>\n <td>115</td>\n <td>66</td>\n <td>18.0</td>\n </tr>\n <tr>\n <th>16</th>\n <td>Kentucky</td>\n <td>9.7</td>\n <td>109</td>\n <td>52</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>17</th>\n <td>Louisiana</td>\n <td>15.4</td>\n <td>249</td>\n <td>66</td>\n <td>22.2</td>\n </tr>\n <tr>\n <th>18</th>\n <td>Maine</td>\n <td>2.1</td>\n <td>83</td>\n <td>51</td>\n <td>7.8</td>\n </tr>\n <tr>\n <th>19</th>\n <td>Maryland</td>\n <td>11.3</td>\n <td>300</td>\n <td>67</td>\n <td>27.8</td>\n </tr>\n <tr>\n <th>20</th>\n <td>Massachusetts</td>\n <td>4.4</td>\n <td>149</td>\n <td>85</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>21</th>\n <td>Michigan</td>\n <td>12.1</td>\n <td>255</td>\n <td>74</td>\n <td>35.1</td>\n </tr>\n <tr>\n <th>22</th>\n <td>Minnesota</td>\n <td>2.7</td>\n <td>72</td>\n <td>66</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>23</th>\n <td>Mississippi</td>\n <td>16.1</td>\n <td>259</td>\n <td>44</td>\n <td>17.1</td>\n </tr>\n <tr>\n <th>24</th>\n <td>Missouri</td>\n <td>9.0</td>\n <td>178</td>\n <td>70</td>\n <td>28.2</td>\n </tr>\n <tr>\n <th>25</th>\n <td>Montana</td>\n <td>6.0</td>\n <td>109</td>\n <td>53</td>\n <td>16.4</td>\n </tr>\n <tr>\n <th>26</th>\n <td>Nebraska</td>\n <td>4.3</td>\n <td>102</td>\n <td>62</td>\n <td>16.5</td>\n </tr>\n <tr>\n <th>27</th>\n <td>Nevada</td>\n <td>12.2</td>\n <td>252</td>\n <td>81</td>\n <td>46.0</td>\n </tr>\n <tr>\n <th>28</th>\n <td>New Hampshire</td>\n <td>2.1</td>\n <td>57</td>\n <td>56</td>\n <td>9.5</td>\n </tr>\n <tr>\n <th>29</th>\n <td>New Jersey</td>\n <td>7.4</td>\n <td>159</td>\n <td>89</td>\n <td>18.8</td>\n </tr>\n <tr>\n <th>30</th>\n <td>New Mexico</td>\n <td>11.4</td>\n <td>285</td>\n <td>70</td>\n <td>32.1</td>\n </tr>\n <tr>\n <th>31</th>\n <td>New York</td>\n <td>11.1</td>\n <td>254</td>\n 
<td>86</td>\n <td>26.1</td>\n </tr>\n <tr>\n <th>32</th>\n <td>North Carolina</td>\n <td>13.0</td>\n <td>337</td>\n <td>45</td>\n <td>16.1</td>\n </tr>\n <tr>\n <th>33</th>\n <td>North Dakota</td>\n <td>0.8</td>\n <td>45</td>\n <td>44</td>\n <td>7.3</td>\n </tr>\n <tr>\n <th>34</th>\n <td>Ohio</td>\n <td>7.3</td>\n <td>120</td>\n <td>75</td>\n <td>21.4</td>\n </tr>\n <tr>\n <th>35</th>\n <td>Oklahoma</td>\n <td>6.6</td>\n <td>151</td>\n <td>68</td>\n <td>20.0</td>\n </tr>\n <tr>\n <th>36</th>\n <td>Oregon</td>\n <td>4.9</td>\n <td>159</td>\n <td>67</td>\n <td>29.3</td>\n </tr>\n <tr>\n <th>37</th>\n <td>Pennsylvania</td>\n <td>6.3</td>\n <td>106</td>\n <td>72</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>38</th>\n <td>Rhode Island</td>\n <td>3.4</td>\n <td>174</td>\n <td>87</td>\n <td>8.3</td>\n </tr>\n <tr>\n <th>39</th>\n <td>South Carolina</td>\n <td>14.4</td>\n <td>279</td>\n <td>48</td>\n <td>22.5</td>\n </tr>\n <tr>\n <th>40</th>\n <td>South Dakota</td>\n <td>3.8</td>\n <td>86</td>\n <td>45</td>\n <td>12.8</td>\n </tr>\n <tr>\n <th>41</th>\n <td>Tennessee</td>\n <td>13.2</td>\n <td>188</td>\n <td>59</td>\n <td>26.9</td>\n </tr>\n <tr>\n <th>42</th>\n <td>Texas</td>\n <td>12.7</td>\n <td>201</td>\n <td>80</td>\n <td>25.5</td>\n </tr>\n <tr>\n <th>43</th>\n <td>Utah</td>\n <td>3.2</td>\n <td>120</td>\n <td>80</td>\n <td>22.9</td>\n </tr>\n <tr>\n <th>44</th>\n <td>Vermont</td>\n <td>2.2</td>\n <td>48</td>\n <td>32</td>\n <td>11.2</td>\n </tr>\n <tr>\n <th>45</th>\n <td>Virginia</td>\n <td>8.5</td>\n <td>156</td>\n <td>63</td>\n <td>20.7</td>\n </tr>\n <tr>\n <th>46</th>\n <td>Washington</td>\n <td>4.0</td>\n <td>145</td>\n <td>73</td>\n <td>26.2</td>\n </tr>\n <tr>\n <th>47</th>\n <td>West Virginia</td>\n <td>5.7</td>\n <td>81</td>\n <td>39</td>\n <td>9.3</td>\n </tr>\n <tr>\n <th>48</th>\n <td>Wisconsin</td>\n <td>2.6</td>\n <td>53</td>\n <td>66</td>\n <td>10.8</td>\n </tr>\n <tr>\n <th>49</th>\n <td>Wyoming</td>\n <td>6.8</td>\n <td>161</td>\n <td>60</td>\n 
<td>15.6</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-43ede5bf-95a6-45df-bcfd-60af9dd9bc8d')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-43ede5bf-95a6-45df-bcfd-60af9dd9bc8d button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 
'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-43ede5bf-95a6-45df-bcfd-60af9dd9bc8d');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Unnamed: 0 Murder Assault UrbanPop Rape\n0 Alabama 13.2 236 58 21.2\n1 Alaska 10.0 263 48 44.5\n2 Arizona 8.1 294 80 31.0\n3 Arkansas 8.8 190 50 19.5\n4 California 9.0 276 91 40.6\n5 Colorado 7.9 204 78 38.7\n6 Connecticut 3.3 110 77 11.1\n7 Delaware 5.9 238 72 15.8\n8 Florida 15.4 335 80 31.9\n9 Georgia 17.4 211 60 25.8\n10 Hawaii 5.3 46 83 20.2\n11 Idaho 2.6 120 54 14.2\n12 Illinois 10.4 249 83 24.0\n13 Indiana 7.2 113 65 21.0\n14 Iowa 2.2 56 57 11.3\n15 Kansas 6.0 115 66 18.0\n16 Kentucky 9.7 109 52 16.3\n17 Louisiana 15.4 249 66 22.2\n18 Maine 2.1 83 51 7.8\n19 Maryland 11.3 300 67 27.8\n20 Massachusetts 4.4 149 85 16.3\n21 Michigan 12.1 255 74 35.1\n22 Minnesota 2.7 72 66 14.9\n23 Mississippi 16.1 259 44 17.1\n24 Missouri 9.0 178 70 28.2\n25 Montana 6.0 109 53 16.4\n26 Nebraska 4.3 102 62 16.5\n27 Nevada 12.2 252 81 46.0\n28 New Hampshire 2.1 57 56 9.5\n29 New Jersey 7.4 159 89 18.8\n30 New Mexico 11.4 285 70 32.1\n31 New York 11.1 254 86 26.1\n32 North Carolina 13.0 337 45 16.1\n33 North Dakota 0.8 45 44 7.3\n34 Ohio 7.3 120 75 21.4\n35 Oklahoma 6.6 151 68 20.0\n36 Oregon 4.9 159 67 29.3\n37 Pennsylvania 6.3 106 72 14.9\n38 Rhode Island 3.4 174 87 8.3\n39 South Carolina 14.4 279 48 22.5\n40 South Dakota 3.8 86 45 12.8\n41 Tennessee 13.2 188 59 26.9\n42 Texas 12.7 201 80 25.5\n43 Utah 3.2 120 80 22.9\n44 Vermont 2.2 48 32 11.2\n45 Virginia 8.5 156 63 20.7\n46 Washington 4.0 145 73 26.2\n47 West Virginia 5.7 81 39 9.3\n48 Wisconsin 2.6 53 66 10.8\n49 Wyoming 6.8 161 60 15.6"
},
"execution_count": 29,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "hlxXCyCXa_1G",
"outputId": "0cfb979e-18d9-4e0f-d883-27531239bcab",
"trusted": false
},
"cell_type": "code",
"source": "df.info()",
"execution_count": null,
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": "<class 'pandas.core.frame.DataFrame'>\nRangeIndex: 50 entries, 0 to 49\nData columns (total 5 columns):\n # Column Non-Null Count Dtype \n--- ------ -------------- ----- \n 0 Unnamed: 0 50 non-null object \n 1 Murder 50 non-null float64\n 2 Assault 50 non-null int64 \n 3 UrbanPop 50 non-null int64 \n 4 Rape 50 non-null float64\ndtypes: float64(2), int64(2), object(1)\nmemory usage: 2.1+ KB\n"
}
]
},
{
"metadata": {
"id": "uFz2CLSRM3_X",
"trusted": false
},
"cell_type": "code",
"source": "def norm_function(i):\n x = (i-i.min())/(i.max()-i.min())\n return (x)",
"execution_count": null,
"outputs": []
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "8xLTia4CNYdc",
"outputId": "e7f3c939-62f3-4162-a0b9-7e6e11dbc4c1",
"trusted": false
},
"cell_type": "code",
"source": "df_norm = norm_function(df.iloc[:,1:])\ndf_norm",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-fa4b1e91-f56a-4d5a-bde0-269a588278cf\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>0.746988</td>\n <td>0.654110</td>\n <td>0.440678</td>\n <td>0.359173</td>\n </tr>\n <tr>\n <th>1</th>\n <td>0.554217</td>\n <td>0.746575</td>\n <td>0.271186</td>\n <td>0.961240</td>\n </tr>\n <tr>\n <th>2</th>\n <td>0.439759</td>\n <td>0.852740</td>\n <td>0.813559</td>\n <td>0.612403</td>\n </tr>\n <tr>\n <th>3</th>\n <td>0.481928</td>\n <td>0.496575</td>\n <td>0.305085</td>\n <td>0.315245</td>\n </tr>\n <tr>\n <th>4</th>\n <td>0.493976</td>\n <td>0.791096</td>\n <td>1.000000</td>\n <td>0.860465</td>\n </tr>\n <tr>\n <th>5</th>\n <td>0.427711</td>\n <td>0.544521</td>\n <td>0.779661</td>\n <td>0.811370</td>\n </tr>\n <tr>\n <th>6</th>\n <td>0.150602</td>\n <td>0.222603</td>\n <td>0.762712</td>\n <td>0.098191</td>\n </tr>\n <tr>\n <th>7</th>\n <td>0.307229</td>\n <td>0.660959</td>\n <td>0.677966</td>\n <td>0.219638</td>\n </tr>\n <tr>\n <th>8</th>\n <td>0.879518</td>\n <td>0.993151</td>\n <td>0.813559</td>\n <td>0.635659</td>\n </tr>\n <tr>\n <th>9</th>\n <td>1.000000</td>\n <td>0.568493</td>\n <td>0.474576</td>\n <td>0.478036</td>\n </tr>\n <tr>\n <th>10</th>\n <td>0.271084</td>\n <td>0.003425</td>\n <td>0.864407</td>\n <td>0.333333</td>\n </tr>\n <tr>\n <th>11</th>\n <td>0.108434</td>\n <td>0.256849</td>\n <td>0.372881</td>\n <td>0.178295</td>\n </tr>\n <tr>\n <th>12</th>\n <td>0.578313</td>\n <td>0.698630</td>\n <td>0.864407</td>\n <td>0.431525</td>\n </tr>\n <tr>\n <th>13</th>\n <td>0.385542</td>\n <td>0.232877</td>\n 
<td>0.559322</td>\n <td>0.354005</td>\n </tr>\n <tr>\n <th>14</th>\n <td>0.084337</td>\n <td>0.037671</td>\n <td>0.423729</td>\n <td>0.103359</td>\n </tr>\n <tr>\n <th>15</th>\n <td>0.313253</td>\n <td>0.239726</td>\n <td>0.576271</td>\n <td>0.276486</td>\n </tr>\n <tr>\n <th>16</th>\n <td>0.536145</td>\n <td>0.219178</td>\n <td>0.338983</td>\n <td>0.232558</td>\n </tr>\n <tr>\n <th>17</th>\n <td>0.879518</td>\n <td>0.698630</td>\n <td>0.576271</td>\n <td>0.385013</td>\n </tr>\n <tr>\n <th>18</th>\n <td>0.078313</td>\n <td>0.130137</td>\n <td>0.322034</td>\n <td>0.012920</td>\n </tr>\n <tr>\n <th>19</th>\n <td>0.632530</td>\n <td>0.873288</td>\n <td>0.593220</td>\n <td>0.529716</td>\n </tr>\n <tr>\n <th>20</th>\n <td>0.216867</td>\n <td>0.356164</td>\n <td>0.898305</td>\n <td>0.232558</td>\n </tr>\n <tr>\n <th>21</th>\n <td>0.680723</td>\n <td>0.719178</td>\n <td>0.711864</td>\n <td>0.718346</td>\n </tr>\n <tr>\n <th>22</th>\n <td>0.114458</td>\n <td>0.092466</td>\n <td>0.576271</td>\n <td>0.196382</td>\n </tr>\n <tr>\n <th>23</th>\n <td>0.921687</td>\n <td>0.732877</td>\n <td>0.203390</td>\n <td>0.253230</td>\n </tr>\n <tr>\n <th>24</th>\n <td>0.493976</td>\n <td>0.455479</td>\n <td>0.644068</td>\n <td>0.540052</td>\n </tr>\n <tr>\n <th>25</th>\n <td>0.313253</td>\n <td>0.219178</td>\n <td>0.355932</td>\n <td>0.235142</td>\n </tr>\n <tr>\n <th>26</th>\n <td>0.210843</td>\n <td>0.195205</td>\n <td>0.508475</td>\n <td>0.237726</td>\n </tr>\n <tr>\n <th>27</th>\n <td>0.686747</td>\n <td>0.708904</td>\n <td>0.830508</td>\n <td>1.000000</td>\n </tr>\n <tr>\n <th>28</th>\n <td>0.078313</td>\n <td>0.041096</td>\n <td>0.406780</td>\n <td>0.056848</td>\n </tr>\n <tr>\n <th>29</th>\n <td>0.397590</td>\n <td>0.390411</td>\n <td>0.966102</td>\n <td>0.297158</td>\n </tr>\n <tr>\n <th>30</th>\n <td>0.638554</td>\n <td>0.821918</td>\n <td>0.644068</td>\n <td>0.640827</td>\n </tr>\n <tr>\n <th>31</th>\n <td>0.620482</td>\n <td>0.715753</td>\n <td>0.915254</td>\n 
<td>0.485788</td>\n </tr>\n <tr>\n <th>32</th>\n <td>0.734940</td>\n <td>1.000000</td>\n <td>0.220339</td>\n <td>0.227390</td>\n </tr>\n <tr>\n <th>33</th>\n <td>0.000000</td>\n <td>0.000000</td>\n <td>0.203390</td>\n <td>0.000000</td>\n </tr>\n <tr>\n <th>34</th>\n <td>0.391566</td>\n <td>0.256849</td>\n <td>0.728814</td>\n <td>0.364341</td>\n </tr>\n <tr>\n <th>35</th>\n <td>0.349398</td>\n <td>0.363014</td>\n <td>0.610169</td>\n <td>0.328165</td>\n </tr>\n <tr>\n <th>36</th>\n <td>0.246988</td>\n <td>0.390411</td>\n <td>0.593220</td>\n <td>0.568475</td>\n </tr>\n <tr>\n <th>37</th>\n <td>0.331325</td>\n <td>0.208904</td>\n <td>0.677966</td>\n <td>0.196382</td>\n </tr>\n <tr>\n <th>38</th>\n <td>0.156627</td>\n <td>0.441781</td>\n <td>0.932203</td>\n <td>0.025840</td>\n </tr>\n <tr>\n <th>39</th>\n <td>0.819277</td>\n <td>0.801370</td>\n <td>0.271186</td>\n <td>0.392765</td>\n </tr>\n <tr>\n <th>40</th>\n <td>0.180723</td>\n <td>0.140411</td>\n <td>0.220339</td>\n <td>0.142119</td>\n </tr>\n <tr>\n <th>41</th>\n <td>0.746988</td>\n <td>0.489726</td>\n <td>0.457627</td>\n <td>0.506460</td>\n </tr>\n <tr>\n <th>42</th>\n <td>0.716867</td>\n <td>0.534247</td>\n <td>0.813559</td>\n <td>0.470284</td>\n </tr>\n <tr>\n <th>43</th>\n <td>0.144578</td>\n <td>0.256849</td>\n <td>0.813559</td>\n <td>0.403101</td>\n </tr>\n <tr>\n <th>44</th>\n <td>0.084337</td>\n <td>0.010274</td>\n <td>0.000000</td>\n <td>0.100775</td>\n </tr>\n <tr>\n <th>45</th>\n <td>0.463855</td>\n <td>0.380137</td>\n <td>0.525424</td>\n <td>0.346253</td>\n </tr>\n <tr>\n <th>46</th>\n <td>0.192771</td>\n <td>0.342466</td>\n <td>0.694915</td>\n <td>0.488372</td>\n </tr>\n <tr>\n <th>47</th>\n <td>0.295181</td>\n <td>0.123288</td>\n <td>0.118644</td>\n <td>0.051680</td>\n </tr>\n <tr>\n <th>48</th>\n <td>0.108434</td>\n <td>0.027397</td>\n <td>0.576271</td>\n <td>0.090439</td>\n </tr>\n <tr>\n <th>49</th>\n <td>0.361446</td>\n <td>0.397260</td>\n <td>0.474576</td>\n <td>0.214470</td>\n </tr>\n 
</tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-fa4b1e91-f56a-4d5a-bde0-269a588278cf')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-fa4b1e91-f56a-4d5a-bde0-269a588278cf button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 
'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-fa4b1e91-f56a-4d5a-bde0-269a588278cf');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Murder Assault UrbanPop Rape\n0 0.746988 0.654110 0.440678 0.359173\n1 0.554217 0.746575 0.271186 0.961240\n2 0.439759 0.852740 0.813559 0.612403\n3 0.481928 0.496575 0.305085 0.315245\n4 0.493976 0.791096 1.000000 0.860465\n5 0.427711 0.544521 0.779661 0.811370\n6 0.150602 0.222603 0.762712 0.098191\n7 0.307229 0.660959 0.677966 0.219638\n8 0.879518 0.993151 0.813559 0.635659\n9 1.000000 0.568493 0.474576 0.478036\n10 0.271084 0.003425 0.864407 0.333333\n11 0.108434 0.256849 0.372881 0.178295\n12 0.578313 0.698630 0.864407 0.431525\n13 0.385542 0.232877 0.559322 0.354005\n14 0.084337 0.037671 0.423729 0.103359\n15 0.313253 0.239726 0.576271 0.276486\n16 0.536145 0.219178 0.338983 0.232558\n17 0.879518 0.698630 0.576271 0.385013\n18 0.078313 0.130137 0.322034 0.012920\n19 0.632530 0.873288 0.593220 0.529716\n20 0.216867 0.356164 0.898305 0.232558\n21 0.680723 0.719178 0.711864 0.718346\n22 0.114458 0.092466 0.576271 0.196382\n23 0.921687 0.732877 0.203390 0.253230\n24 0.493976 0.455479 0.644068 0.540052\n25 0.313253 0.219178 0.355932 0.235142\n26 0.210843 0.195205 0.508475 0.237726\n27 0.686747 0.708904 0.830508 1.000000\n28 0.078313 0.041096 0.406780 0.056848\n29 0.397590 0.390411 0.966102 0.297158\n30 0.638554 0.821918 0.644068 0.640827\n31 0.620482 0.715753 0.915254 0.485788\n32 0.734940 1.000000 0.220339 0.227390\n33 0.000000 0.000000 0.203390 0.000000\n34 0.391566 0.256849 0.728814 0.364341\n35 0.349398 0.363014 0.610169 0.328165\n36 0.246988 0.390411 0.593220 0.568475\n37 0.331325 0.208904 0.677966 0.196382\n38 0.156627 0.441781 0.932203 0.025840\n39 0.819277 0.801370 0.271186 0.392765\n40 0.180723 0.140411 0.220339 0.142119\n41 0.746988 0.489726 0.457627 0.506460\n42 0.716867 0.534247 0.813559 0.470284\n43 0.144578 0.256849 0.813559 0.403101\n44 0.084337 0.010274 0.000000 0.100775\n45 0.463855 0.380137 0.525424 0.346253\n46 0.192771 0.342466 0.694915 0.488372\n47 0.295181 0.123288 0.118644 0.051680\n48 0.108434 0.027397 0.576271 0.090439\n49 
0.361446 0.397260 0.474576 0.214470"
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 413
},
"id": "x3Zb18ixNwUM",
"outputId": "ee41b7dd-ccd8-4fc5-f3dd-4484a0ddba38",
"trusted": false
},
"cell_type": "code",
"source": "from scipy.cluster.hierarchy import linkage\nimport scipy.cluster.hierarchy as sch\nz = linkage(df_norm,method=\"average\",metric=\"euclidean\")\nplt.figure(figsize=(35, 12))\nplt.title('Hierarchical Clustering Dendrogram')\nplt.xlabel('Index')\nplt.ylabel('Distance')\nsch.dendrogram(z)\nplt.show() ",
"execution_count": null,
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": "<Figure size 2520x864 with 1 Axes>"
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
]
},
{
"metadata": {
"id": "XJckHrEHUP83",
"trusted": false
},
"cell_type": "code",
"source": "from sklearn.cluster import AgglomerativeClustering\nimport warnings \nwarnings.filterwarnings(\"ignore\")\nh_complete = AgglomerativeClustering(n_clusters=4,linkage=\"average\",affinity=\"euclidean\").fit(df_norm)\ncluster_labels=pd.Series(h_complete.labels_)\ncluster_labels\ndf['clust']=cluster_labels # creating a new column and assigning clusters\n#df",
"execution_count": null,
"outputs": []
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 206
},
"id": "idP0l5oJV6Ye",
"outputId": "749088c3-966f-4faf-e7ee-f0d893bb82ea",
"trusted": false
},
"cell_type": "code",
"source": "df.iloc[:,1:].groupby(df.clust).mean()",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-3cfecaea-8c9a-4fc3-bce6-d61e9dd51aaf\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n <th>clust</th>\n </tr>\n <tr>\n <th>clust</th>\n <th></th>\n <th></th>\n <th></th>\n <th></th>\n <th></th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>4.870000</td>\n <td>114.433333</td>\n <td>63.633333</td>\n <td>15.943333</td>\n <td>0.0</td>\n </tr>\n <tr>\n <th>1</th>\n <td>10.883333</td>\n <td>256.916667</td>\n <td>78.333333</td>\n <td>32.250000</td>\n <td>1.0</td>\n </tr>\n <tr>\n <th>2</th>\n <td>10.000000</td>\n <td>263.000000</td>\n <td>48.000000</td>\n <td>44.500000</td>\n <td>2.0</td>\n </tr>\n <tr>\n <th>3</th>\n <td>14.671429</td>\n <td>251.285714</td>\n <td>54.285714</td>\n <td>21.685714</td>\n <td>3.0</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-3cfecaea-8c9a-4fc3-bce6-d61e9dd51aaf')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 
20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-3cfecaea-8c9a-4fc3-bce6-d61e9dd51aaf button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-3cfecaea-8c9a-4fc3-bce6-d61e9dd51aaf');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Murder Assault UrbanPop Rape clust\nclust \n0 4.870000 114.433333 63.633333 15.943333 0.0\n1 10.883333 256.916667 78.333333 32.250000 1.0\n2 10.000000 263.000000 48.000000 44.500000 2.0\n3 14.671429 251.285714 54.285714 21.685714 3.0"
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"id": "3E2ULJEuWhUS"
},
"cell_type": "markdown",
"source": "# K Means Clustering"
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 530
},
"id": "qQ5duyCSWle1",
"outputId": "e15ca6a5-cfaf-496d-a5f0-d7497957833f",
"trusted": false
},
"cell_type": "code",
"source": "from sklearn.cluster import KMeans\nfig = plt.figure(figsize=(10,8))\nwcss= []\nfor i in range(1,10):\n clf= KMeans(n_clusters=i)\n clf.fit(df_norm)\n wcss.append(clf.inertia_)\nplt.plot(range(1,10),wcss)\nplt.title(\"The Elbow Method\")\nplt.xlabel(\"No of clusters\")\nplt.ylabel(\"wcss\")",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "Text(0, 0.5, 'wcss')"
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": "<Figure size 720x576 with 1 Axes>"
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "M9sUEDCQYJqD",
"outputId": "2db7be6f-060d-4035-e792-f525fad68ce5",
"trusted": false
},
"cell_type": "code",
"source": "clf = KMeans(n_clusters=4)\ny_kmeans = clf.fit_predict(df_norm) \ny_kmeans",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "array([2, 1, 1, 2, 1, 1, 3, 3, 1, 2, 3, 0, 1, 3, 0, 3, 0, 2, 0, 1, 3, 1,\n 0, 2, 3, 0, 0, 1, 0, 3, 1, 1, 2, 0, 3, 3, 3, 3, 3, 2, 0, 2, 1, 3,\n 0, 3, 3, 0, 0, 3], dtype=int32)"
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "sf8xiImGYfIB",
"outputId": "f80f3f55-f978-441c-f0bc-d0a72ac9b383",
"trusted": false
},
"cell_type": "code",
"source": "clf.cluster_centers_",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "array([[0.1686747 , 0.11485774, 0.34028683, 0.12601868],\n [0.6124498 , 0.75 , 0.75423729, 0.67980189],\n [0.79141566, 0.6802226 , 0.36864407, 0.36466408],\n [0.30439405, 0.32937147, 0.70588235, 0.31098951]])"
},
"execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "hx1KFqn-Ytjm",
"outputId": "85670cce-d6ec-4740-9eaa-bac902639abc",
"trusted": false
},
"cell_type": "code",
"source": "md= pd.Series(y_kmeans)\ndf['clust']=md\ndf",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-74fe6d4b-9396-4588-8e5d-50cd2f7e959a\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Unnamed: 0</th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n <th>clust</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>Alabama</td>\n <td>13.2</td>\n <td>236</td>\n <td>58</td>\n <td>21.2</td>\n <td>2</td>\n </tr>\n <tr>\n <th>1</th>\n <td>Alaska</td>\n <td>10.0</td>\n <td>263</td>\n <td>48</td>\n <td>44.5</td>\n <td>1</td>\n </tr>\n <tr>\n <th>2</th>\n <td>Arizona</td>\n <td>8.1</td>\n <td>294</td>\n <td>80</td>\n <td>31.0</td>\n <td>1</td>\n </tr>\n <tr>\n <th>3</th>\n <td>Arkansas</td>\n <td>8.8</td>\n <td>190</td>\n <td>50</td>\n <td>19.5</td>\n <td>2</td>\n </tr>\n <tr>\n <th>4</th>\n <td>California</td>\n <td>9.0</td>\n <td>276</td>\n <td>91</td>\n <td>40.6</td>\n <td>1</td>\n </tr>\n <tr>\n <th>5</th>\n <td>Colorado</td>\n <td>7.9</td>\n <td>204</td>\n <td>78</td>\n <td>38.7</td>\n <td>1</td>\n </tr>\n <tr>\n <th>6</th>\n <td>Connecticut</td>\n <td>3.3</td>\n <td>110</td>\n <td>77</td>\n <td>11.1</td>\n <td>3</td>\n </tr>\n <tr>\n <th>7</th>\n <td>Delaware</td>\n <td>5.9</td>\n <td>238</td>\n <td>72</td>\n <td>15.8</td>\n <td>3</td>\n </tr>\n <tr>\n <th>8</th>\n <td>Florida</td>\n <td>15.4</td>\n <td>335</td>\n <td>80</td>\n <td>31.9</td>\n <td>1</td>\n </tr>\n <tr>\n <th>9</th>\n <td>Georgia</td>\n <td>17.4</td>\n <td>211</td>\n <td>60</td>\n <td>25.8</td>\n <td>2</td>\n </tr>\n <tr>\n <th>10</th>\n <td>Hawaii</td>\n <td>5.3</td>\n <td>46</td>\n <td>83</td>\n <td>20.2</td>\n <td>3</td>\n </tr>\n <tr>\n <th>11</th>\n <td>Idaho</td>\n <td>2.6</td>\n <td>120</td>\n <td>54</td>\n <td>14.2</td>\n 
<td>0</td>\n </tr>\n <tr>\n <th>12</th>\n <td>Illinois</td>\n <td>10.4</td>\n <td>249</td>\n <td>83</td>\n <td>24.0</td>\n <td>1</td>\n </tr>\n <tr>\n <th>13</th>\n <td>Indiana</td>\n <td>7.2</td>\n <td>113</td>\n <td>65</td>\n <td>21.0</td>\n <td>3</td>\n </tr>\n <tr>\n <th>14</th>\n <td>Iowa</td>\n <td>2.2</td>\n <td>56</td>\n <td>57</td>\n <td>11.3</td>\n <td>0</td>\n </tr>\n <tr>\n <th>15</th>\n <td>Kansas</td>\n <td>6.0</td>\n <td>115</td>\n <td>66</td>\n <td>18.0</td>\n <td>3</td>\n </tr>\n <tr>\n <th>16</th>\n <td>Kentucky</td>\n <td>9.7</td>\n <td>109</td>\n <td>52</td>\n <td>16.3</td>\n <td>0</td>\n </tr>\n <tr>\n <th>17</th>\n <td>Louisiana</td>\n <td>15.4</td>\n <td>249</td>\n <td>66</td>\n <td>22.2</td>\n <td>2</td>\n </tr>\n <tr>\n <th>18</th>\n <td>Maine</td>\n <td>2.1</td>\n <td>83</td>\n <td>51</td>\n <td>7.8</td>\n <td>0</td>\n </tr>\n <tr>\n <th>19</th>\n <td>Maryland</td>\n <td>11.3</td>\n <td>300</td>\n <td>67</td>\n <td>27.8</td>\n <td>1</td>\n </tr>\n <tr>\n <th>20</th>\n <td>Massachusetts</td>\n <td>4.4</td>\n <td>149</td>\n <td>85</td>\n <td>16.3</td>\n <td>3</td>\n </tr>\n <tr>\n <th>21</th>\n <td>Michigan</td>\n <td>12.1</td>\n <td>255</td>\n <td>74</td>\n <td>35.1</td>\n <td>1</td>\n </tr>\n <tr>\n <th>22</th>\n <td>Minnesota</td>\n <td>2.7</td>\n <td>72</td>\n <td>66</td>\n <td>14.9</td>\n <td>0</td>\n </tr>\n <tr>\n <th>23</th>\n <td>Mississippi</td>\n <td>16.1</td>\n <td>259</td>\n <td>44</td>\n <td>17.1</td>\n <td>2</td>\n </tr>\n <tr>\n <th>24</th>\n <td>Missouri</td>\n <td>9.0</td>\n <td>178</td>\n <td>70</td>\n <td>28.2</td>\n <td>3</td>\n </tr>\n <tr>\n <th>25</th>\n <td>Montana</td>\n <td>6.0</td>\n <td>109</td>\n <td>53</td>\n <td>16.4</td>\n <td>0</td>\n </tr>\n <tr>\n <th>26</th>\n <td>Nebraska</td>\n <td>4.3</td>\n <td>102</td>\n <td>62</td>\n <td>16.5</td>\n <td>0</td>\n </tr>\n <tr>\n <th>27</th>\n <td>Nevada</td>\n <td>12.2</td>\n <td>252</td>\n <td>81</td>\n <td>46.0</td>\n <td>1</td>\n </tr>\n <tr>\n <th>28</th>\n 
<td>New Hampshire</td>\n <td>2.1</td>\n <td>57</td>\n <td>56</td>\n <td>9.5</td>\n <td>0</td>\n </tr>\n <tr>\n <th>29</th>\n <td>New Jersey</td>\n <td>7.4</td>\n <td>159</td>\n <td>89</td>\n <td>18.8</td>\n <td>3</td>\n </tr>\n <tr>\n <th>30</th>\n <td>New Mexico</td>\n <td>11.4</td>\n <td>285</td>\n <td>70</td>\n <td>32.1</td>\n <td>1</td>\n </tr>\n <tr>\n <th>31</th>\n <td>New York</td>\n <td>11.1</td>\n <td>254</td>\n <td>86</td>\n <td>26.1</td>\n <td>1</td>\n </tr>\n <tr>\n <th>32</th>\n <td>North Carolina</td>\n <td>13.0</td>\n <td>337</td>\n <td>45</td>\n <td>16.1</td>\n <td>2</td>\n </tr>\n <tr>\n <th>33</th>\n <td>North Dakota</td>\n <td>0.8</td>\n <td>45</td>\n <td>44</td>\n <td>7.3</td>\n <td>0</td>\n </tr>\n <tr>\n <th>34</th>\n <td>Ohio</td>\n <td>7.3</td>\n <td>120</td>\n <td>75</td>\n <td>21.4</td>\n <td>3</td>\n </tr>\n <tr>\n <th>35</th>\n <td>Oklahoma</td>\n <td>6.6</td>\n <td>151</td>\n <td>68</td>\n <td>20.0</td>\n <td>3</td>\n </tr>\n <tr>\n <th>36</th>\n <td>Oregon</td>\n <td>4.9</td>\n <td>159</td>\n <td>67</td>\n <td>29.3</td>\n <td>3</td>\n </tr>\n <tr>\n <th>37</th>\n <td>Pennsylvania</td>\n <td>6.3</td>\n <td>106</td>\n <td>72</td>\n <td>14.9</td>\n <td>3</td>\n </tr>\n <tr>\n <th>38</th>\n <td>Rhode Island</td>\n <td>3.4</td>\n <td>174</td>\n <td>87</td>\n <td>8.3</td>\n <td>3</td>\n </tr>\n <tr>\n <th>39</th>\n <td>South Carolina</td>\n <td>14.4</td>\n <td>279</td>\n <td>48</td>\n <td>22.5</td>\n <td>2</td>\n </tr>\n <tr>\n <th>40</th>\n <td>South Dakota</td>\n <td>3.8</td>\n <td>86</td>\n <td>45</td>\n <td>12.8</td>\n <td>0</td>\n </tr>\n <tr>\n <th>41</th>\n <td>Tennessee</td>\n <td>13.2</td>\n <td>188</td>\n <td>59</td>\n <td>26.9</td>\n <td>2</td>\n </tr>\n <tr>\n <th>42</th>\n <td>Texas</td>\n <td>12.7</td>\n <td>201</td>\n <td>80</td>\n <td>25.5</td>\n <td>1</td>\n </tr>\n <tr>\n <th>43</th>\n <td>Utah</td>\n <td>3.2</td>\n <td>120</td>\n <td>80</td>\n <td>22.9</td>\n <td>3</td>\n </tr>\n <tr>\n <th>44</th>\n <td>Vermont</td>\n 
<td>2.2</td>\n <td>48</td>\n <td>32</td>\n <td>11.2</td>\n <td>0</td>\n </tr>\n <tr>\n <th>45</th>\n <td>Virginia</td>\n <td>8.5</td>\n <td>156</td>\n <td>63</td>\n <td>20.7</td>\n <td>3</td>\n </tr>\n <tr>\n <th>46</th>\n <td>Washington</td>\n <td>4.0</td>\n <td>145</td>\n <td>73</td>\n <td>26.2</td>\n <td>3</td>\n </tr>\n <tr>\n <th>47</th>\n <td>West Virginia</td>\n <td>5.7</td>\n <td>81</td>\n <td>39</td>\n <td>9.3</td>\n <td>0</td>\n </tr>\n <tr>\n <th>48</th>\n <td>Wisconsin</td>\n <td>2.6</td>\n <td>53</td>\n <td>66</td>\n <td>10.8</td>\n <td>0</td>\n </tr>\n <tr>\n <th>49</th>\n <td>Wyoming</td>\n <td>6.8</td>\n <td>161</td>\n <td>60</td>\n <td>15.6</td>\n <td>3</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-74fe6d4b-9396-4588-8e5d-50cd2f7e959a')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 
64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-74fe6d4b-9396-4588-8e5d-50cd2f7e959a button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-74fe6d4b-9396-4588-8e5d-50cd2f7e959a');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Unnamed: 0 Murder Assault UrbanPop Rape clust\n0 Alabama 13.2 236 58 21.2 2\n1 Alaska 10.0 263 48 44.5 1\n2 Arizona 8.1 294 80 31.0 1\n3 Arkansas 8.8 190 50 19.5 2\n4 California 9.0 276 91 40.6 1\n5 Colorado 7.9 204 78 38.7 1\n6 Connecticut 3.3 110 77 11.1 3\n7 Delaware 5.9 238 72 15.8 3\n8 Florida 15.4 335 80 31.9 1\n9 Georgia 17.4 211 60 25.8 2\n10 Hawaii 5.3 46 83 20.2 3\n11 Idaho 2.6 120 54 14.2 0\n12 Illinois 10.4 249 83 24.0 1\n13 Indiana 7.2 113 65 21.0 3\n14 Iowa 2.2 56 57 11.3 0\n15 Kansas 6.0 115 66 18.0 3\n16 Kentucky 9.7 109 52 16.3 0\n17 Louisiana 15.4 249 66 22.2 2\n18 Maine 2.1 83 51 7.8 0\n19 Maryland 11.3 300 67 27.8 1\n20 Massachusetts 4.4 149 85 16.3 3\n21 Michigan 12.1 255 74 35.1 1\n22 Minnesota 2.7 72 66 14.9 0\n23 Mississippi 16.1 259 44 17.1 2\n24 Missouri 9.0 178 70 28.2 3\n25 Montana 6.0 109 53 16.4 0\n26 Nebraska 4.3 102 62 16.5 0\n27 Nevada 12.2 252 81 46.0 1\n28 New Hampshire 2.1 57 56 9.5 0\n29 New Jersey 7.4 159 89 18.8 3\n30 New Mexico 11.4 285 70 32.1 1\n31 New York 11.1 254 86 26.1 1\n32 North Carolina 13.0 337 45 16.1 2\n33 North Dakota 0.8 45 44 7.3 0\n34 Ohio 7.3 120 75 21.4 3\n35 Oklahoma 6.6 151 68 20.0 3\n36 Oregon 4.9 159 67 29.3 3\n37 Pennsylvania 6.3 106 72 14.9 3\n38 Rhode Island 3.4 174 87 8.3 3\n39 South Carolina 14.4 279 48 22.5 2\n40 South Dakota 3.8 86 45 12.8 0\n41 Tennessee 13.2 188 59 26.9 2\n42 Texas 12.7 201 80 25.5 1\n43 Utah 3.2 120 80 22.9 3\n44 Vermont 2.2 48 32 11.2 0\n45 Virginia 8.5 156 63 20.7 3\n46 Washington 4.0 145 73 26.2 3\n47 West Virginia 5.7 81 39 9.3 0\n48 Wisconsin 2.6 53 66 10.8 0\n49 Wyoming 6.8 161 60 15.6 3"
},
"execution_count": 24,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 206
},
"id": "U18h42DxZFLd",
"outputId": "64ef0fd4-b7e5-4c9b-cc29-e7c1e9253a9f",
"trusted": false
},
"cell_type": "code",
"source": "# Group on the 'clust' column by name so the cluster label is used only as\n# the key and is not averaged as if it were a feature.\ndf.iloc[:, 1:].groupby(\"clust\").mean()",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-262129c3-0a22-4aaf-8273-32f996a4b3a2\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n <th>clust</th>\n </tr>\n <tr>\n <th>clust</th>\n <th></th>\n <th></th>\n <th></th>\n <th></th>\n <th></th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>3.600000</td>\n <td>78.538462</td>\n <td>52.076923</td>\n <td>12.176923</td>\n <td>0.0</td>\n </tr>\n <tr>\n <th>1</th>\n <td>10.966667</td>\n <td>264.000000</td>\n <td>76.500000</td>\n <td>33.608333</td>\n <td>1.0</td>\n </tr>\n <tr>\n <th>2</th>\n <td>13.937500</td>\n <td>243.625000</td>\n <td>53.750000</td>\n <td>21.412500</td>\n <td>2.0</td>\n </tr>\n <tr>\n <th>3</th>\n <td>5.852941</td>\n <td>141.176471</td>\n <td>73.647059</td>\n <td>19.335294</td>\n <td>3.0</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-262129c3-0a22-4aaf-8273-32f996a4b3a2')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 
20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-262129c3-0a22-4aaf-8273-32f996a4b3a2 button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-262129c3-0a22-4aaf-8273-32f996a4b3a2');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Murder Assault UrbanPop Rape clust\nclust \n0 3.600000 78.538462 52.076923 12.176923 0.0\n1 10.966667 264.000000 76.500000 33.608333 1.0\n2 13.937500 243.625000 53.750000 21.412500 2.0\n3 5.852941 141.176471 73.647059 19.335294 3.0"
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 287
},
"id": "BHFKFL8aZPJT",
"outputId": "9f8f2c00-1e9d-4967-fa33-c44e28554b12",
"trusted": false
},
"cell_type": "code",
"source": "# Colour each point by clf.labels_ (clf comes from an earlier cell). Keep the\n# Axes handle so the title is set on the scatter axes explicitly instead of\n# through pyplot's current-axes state; the trailing ';' hides the Text repr.\nax = df.plot.scatter(x=\"UrbanPop\", y=\"Rape\", c=clf.labels_, s=50, cmap=plt.cm.coolwarm)\nax.set_title('Clusters using kmeans');",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "Text(0.5, 1.0, 'Clusters using kmeans')"
},
"execution_count": 27,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": "<Figure size 432x288 with 2 Axes>"
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
]
},
{
"metadata": {
"id": "uWTnCJpoazXH"
},
"cell_type": "markdown",
"source": "# DBSCAN"
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "OL_6p3aGa2Sv",
"outputId": "cb1c4c37-eb6a-4c60-c68e-8a125fd5344c",
"trusted": false
},
"cell_type": "code",
"source": "from sklearn.cluster import DBSCAN\nfrom sklearn.preprocessing import StandardScaler\n\n# Reload the raw CSV so this section starts from a frame without the 'clust'\n# column that was added to df above. Preview a few rows instead of dumping\n# the whole table.\nscan = pd.read_csv(\"crime_data.csv\")\nscan.head()",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-e7ee7e4a-4bb5-436b-957d-b4f55fb357e1\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Unnamed: 0</th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>Alabama</td>\n <td>13.2</td>\n <td>236</td>\n <td>58</td>\n <td>21.2</td>\n </tr>\n <tr>\n <th>1</th>\n <td>Alaska</td>\n <td>10.0</td>\n <td>263</td>\n <td>48</td>\n <td>44.5</td>\n </tr>\n <tr>\n <th>2</th>\n <td>Arizona</td>\n <td>8.1</td>\n <td>294</td>\n <td>80</td>\n <td>31.0</td>\n </tr>\n <tr>\n <th>3</th>\n <td>Arkansas</td>\n <td>8.8</td>\n <td>190</td>\n <td>50</td>\n <td>19.5</td>\n </tr>\n <tr>\n <th>4</th>\n <td>California</td>\n <td>9.0</td>\n <td>276</td>\n <td>91</td>\n <td>40.6</td>\n </tr>\n <tr>\n <th>5</th>\n <td>Colorado</td>\n <td>7.9</td>\n <td>204</td>\n <td>78</td>\n <td>38.7</td>\n </tr>\n <tr>\n <th>6</th>\n <td>Connecticut</td>\n <td>3.3</td>\n <td>110</td>\n <td>77</td>\n <td>11.1</td>\n </tr>\n <tr>\n <th>7</th>\n <td>Delaware</td>\n <td>5.9</td>\n <td>238</td>\n <td>72</td>\n <td>15.8</td>\n </tr>\n <tr>\n <th>8</th>\n <td>Florida</td>\n <td>15.4</td>\n <td>335</td>\n <td>80</td>\n <td>31.9</td>\n </tr>\n <tr>\n <th>9</th>\n <td>Georgia</td>\n <td>17.4</td>\n <td>211</td>\n <td>60</td>\n <td>25.8</td>\n </tr>\n <tr>\n <th>10</th>\n <td>Hawaii</td>\n <td>5.3</td>\n <td>46</td>\n <td>83</td>\n <td>20.2</td>\n </tr>\n <tr>\n <th>11</th>\n <td>Idaho</td>\n <td>2.6</td>\n <td>120</td>\n <td>54</td>\n <td>14.2</td>\n </tr>\n <tr>\n <th>12</th>\n <td>Illinois</td>\n <td>10.4</td>\n <td>249</td>\n <td>83</td>\n <td>24.0</td>\n </tr>\n <tr>\n <th>13</th>\n <td>Indiana</td>\n 
<td>7.2</td>\n <td>113</td>\n <td>65</td>\n <td>21.0</td>\n </tr>\n <tr>\n <th>14</th>\n <td>Iowa</td>\n <td>2.2</td>\n <td>56</td>\n <td>57</td>\n <td>11.3</td>\n </tr>\n <tr>\n <th>15</th>\n <td>Kansas</td>\n <td>6.0</td>\n <td>115</td>\n <td>66</td>\n <td>18.0</td>\n </tr>\n <tr>\n <th>16</th>\n <td>Kentucky</td>\n <td>9.7</td>\n <td>109</td>\n <td>52</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>17</th>\n <td>Louisiana</td>\n <td>15.4</td>\n <td>249</td>\n <td>66</td>\n <td>22.2</td>\n </tr>\n <tr>\n <th>18</th>\n <td>Maine</td>\n <td>2.1</td>\n <td>83</td>\n <td>51</td>\n <td>7.8</td>\n </tr>\n <tr>\n <th>19</th>\n <td>Maryland</td>\n <td>11.3</td>\n <td>300</td>\n <td>67</td>\n <td>27.8</td>\n </tr>\n <tr>\n <th>20</th>\n <td>Massachusetts</td>\n <td>4.4</td>\n <td>149</td>\n <td>85</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>21</th>\n <td>Michigan</td>\n <td>12.1</td>\n <td>255</td>\n <td>74</td>\n <td>35.1</td>\n </tr>\n <tr>\n <th>22</th>\n <td>Minnesota</td>\n <td>2.7</td>\n <td>72</td>\n <td>66</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>23</th>\n <td>Mississippi</td>\n <td>16.1</td>\n <td>259</td>\n <td>44</td>\n <td>17.1</td>\n </tr>\n <tr>\n <th>24</th>\n <td>Missouri</td>\n <td>9.0</td>\n <td>178</td>\n <td>70</td>\n <td>28.2</td>\n </tr>\n <tr>\n <th>25</th>\n <td>Montana</td>\n <td>6.0</td>\n <td>109</td>\n <td>53</td>\n <td>16.4</td>\n </tr>\n <tr>\n <th>26</th>\n <td>Nebraska</td>\n <td>4.3</td>\n <td>102</td>\n <td>62</td>\n <td>16.5</td>\n </tr>\n <tr>\n <th>27</th>\n <td>Nevada</td>\n <td>12.2</td>\n <td>252</td>\n <td>81</td>\n <td>46.0</td>\n </tr>\n <tr>\n <th>28</th>\n <td>New Hampshire</td>\n <td>2.1</td>\n <td>57</td>\n <td>56</td>\n <td>9.5</td>\n </tr>\n <tr>\n <th>29</th>\n <td>New Jersey</td>\n <td>7.4</td>\n <td>159</td>\n <td>89</td>\n <td>18.8</td>\n </tr>\n <tr>\n <th>30</th>\n <td>New Mexico</td>\n <td>11.4</td>\n <td>285</td>\n <td>70</td>\n <td>32.1</td>\n </tr>\n <tr>\n <th>31</th>\n <td>New York</td>\n <td>11.1</td>\n <td>254</td>\n 
<td>86</td>\n <td>26.1</td>\n </tr>\n <tr>\n <th>32</th>\n <td>North Carolina</td>\n <td>13.0</td>\n <td>337</td>\n <td>45</td>\n <td>16.1</td>\n </tr>\n <tr>\n <th>33</th>\n <td>North Dakota</td>\n <td>0.8</td>\n <td>45</td>\n <td>44</td>\n <td>7.3</td>\n </tr>\n <tr>\n <th>34</th>\n <td>Ohio</td>\n <td>7.3</td>\n <td>120</td>\n <td>75</td>\n <td>21.4</td>\n </tr>\n <tr>\n <th>35</th>\n <td>Oklahoma</td>\n <td>6.6</td>\n <td>151</td>\n <td>68</td>\n <td>20.0</td>\n </tr>\n <tr>\n <th>36</th>\n <td>Oregon</td>\n <td>4.9</td>\n <td>159</td>\n <td>67</td>\n <td>29.3</td>\n </tr>\n <tr>\n <th>37</th>\n <td>Pennsylvania</td>\n <td>6.3</td>\n <td>106</td>\n <td>72</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>38</th>\n <td>Rhode Island</td>\n <td>3.4</td>\n <td>174</td>\n <td>87</td>\n <td>8.3</td>\n </tr>\n <tr>\n <th>39</th>\n <td>South Carolina</td>\n <td>14.4</td>\n <td>279</td>\n <td>48</td>\n <td>22.5</td>\n </tr>\n <tr>\n <th>40</th>\n <td>South Dakota</td>\n <td>3.8</td>\n <td>86</td>\n <td>45</td>\n <td>12.8</td>\n </tr>\n <tr>\n <th>41</th>\n <td>Tennessee</td>\n <td>13.2</td>\n <td>188</td>\n <td>59</td>\n <td>26.9</td>\n </tr>\n <tr>\n <th>42</th>\n <td>Texas</td>\n <td>12.7</td>\n <td>201</td>\n <td>80</td>\n <td>25.5</td>\n </tr>\n <tr>\n <th>43</th>\n <td>Utah</td>\n <td>3.2</td>\n <td>120</td>\n <td>80</td>\n <td>22.9</td>\n </tr>\n <tr>\n <th>44</th>\n <td>Vermont</td>\n <td>2.2</td>\n <td>48</td>\n <td>32</td>\n <td>11.2</td>\n </tr>\n <tr>\n <th>45</th>\n <td>Virginia</td>\n <td>8.5</td>\n <td>156</td>\n <td>63</td>\n <td>20.7</td>\n </tr>\n <tr>\n <th>46</th>\n <td>Washington</td>\n <td>4.0</td>\n <td>145</td>\n <td>73</td>\n <td>26.2</td>\n </tr>\n <tr>\n <th>47</th>\n <td>West Virginia</td>\n <td>5.7</td>\n <td>81</td>\n <td>39</td>\n <td>9.3</td>\n </tr>\n <tr>\n <th>48</th>\n <td>Wisconsin</td>\n <td>2.6</td>\n <td>53</td>\n <td>66</td>\n <td>10.8</td>\n </tr>\n <tr>\n <th>49</th>\n <td>Wyoming</td>\n <td>6.8</td>\n <td>161</td>\n <td>60</td>\n 
<td>15.6</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-e7ee7e4a-4bb5-436b-957d-b4f55fb357e1')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-e7ee7e4a-4bb5-436b-957d-b4f55fb357e1 button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 
'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-e7ee7e4a-4bb5-436b-957d-b4f55fb357e1');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Unnamed: 0 Murder Assault UrbanPop Rape\n0 Alabama 13.2 236 58 21.2\n1 Alaska 10.0 263 48 44.5\n2 Arizona 8.1 294 80 31.0\n3 Arkansas 8.8 190 50 19.5\n4 California 9.0 276 91 40.6\n5 Colorado 7.9 204 78 38.7\n6 Connecticut 3.3 110 77 11.1\n7 Delaware 5.9 238 72 15.8\n8 Florida 15.4 335 80 31.9\n9 Georgia 17.4 211 60 25.8\n10 Hawaii 5.3 46 83 20.2\n11 Idaho 2.6 120 54 14.2\n12 Illinois 10.4 249 83 24.0\n13 Indiana 7.2 113 65 21.0\n14 Iowa 2.2 56 57 11.3\n15 Kansas 6.0 115 66 18.0\n16 Kentucky 9.7 109 52 16.3\n17 Louisiana 15.4 249 66 22.2\n18 Maine 2.1 83 51 7.8\n19 Maryland 11.3 300 67 27.8\n20 Massachusetts 4.4 149 85 16.3\n21 Michigan 12.1 255 74 35.1\n22 Minnesota 2.7 72 66 14.9\n23 Mississippi 16.1 259 44 17.1\n24 Missouri 9.0 178 70 28.2\n25 Montana 6.0 109 53 16.4\n26 Nebraska 4.3 102 62 16.5\n27 Nevada 12.2 252 81 46.0\n28 New Hampshire 2.1 57 56 9.5\n29 New Jersey 7.4 159 89 18.8\n30 New Mexico 11.4 285 70 32.1\n31 New York 11.1 254 86 26.1\n32 North Carolina 13.0 337 45 16.1\n33 North Dakota 0.8 45 44 7.3\n34 Ohio 7.3 120 75 21.4\n35 Oklahoma 6.6 151 68 20.0\n36 Oregon 4.9 159 67 29.3\n37 Pennsylvania 6.3 106 72 14.9\n38 Rhode Island 3.4 174 87 8.3\n39 South Carolina 14.4 279 48 22.5\n40 South Dakota 3.8 86 45 12.8\n41 Tennessee 13.2 188 59 26.9\n42 Texas 12.7 201 80 25.5\n43 Utah 3.2 120 80 22.9\n44 Vermont 2.2 48 32 11.2\n45 Virginia 8.5 156 63 20.7\n46 Washington 4.0 145 73 26.2\n47 West Virginia 5.7 81 39 9.3\n48 Wisconsin 2.6 53 66 10.8\n49 Wyoming 6.8 161 60 15.6"
},
"execution_count": 40,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "aE5EGnOfd5GG",
"outputId": "c60e63f7-de6e-479b-b33a-5dd1ab668667",
"trusted": false
},
"cell_type": "code",
"source": "scan.info()",
"execution_count": null,
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": "<class 'pandas.core.frame.DataFrame'>\nRangeIndex: 50 entries, 0 to 49\nData columns (total 5 columns):\n # Column Non-Null Count Dtype \n--- ------ -------------- ----- \n 0 Unnamed: 0 50 non-null object \n 1 Murder 50 non-null float64\n 2 Assault 50 non-null int64 \n 3 UrbanPop 50 non-null int64 \n 4 Rape 50 non-null float64\ndtypes: float64(2), int64(2), object(1)\nmemory usage: 2.1+ KB\n"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "dl3Z2FM0bse7",
"outputId": "fc746afe-4e22-4290-d7ae-eec06c5f029d",
"trusted": false
},
"cell_type": "code",
"source": "# Drop the state-name column ('Unnamed: 0', the only object-dtype column) so\n# that only the four numeric features remain.\nscan1 = scan.drop(columns=[\"Unnamed: 0\"])\nscan1.head()",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-b0ff6977-0c28-4cc6-a93f-bc0488b0e950\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>13.2</td>\n <td>236</td>\n <td>58</td>\n <td>21.2</td>\n </tr>\n <tr>\n <th>1</th>\n <td>10.0</td>\n <td>263</td>\n <td>48</td>\n <td>44.5</td>\n </tr>\n <tr>\n <th>2</th>\n <td>8.1</td>\n <td>294</td>\n <td>80</td>\n <td>31.0</td>\n </tr>\n <tr>\n <th>3</th>\n <td>8.8</td>\n <td>190</td>\n <td>50</td>\n <td>19.5</td>\n </tr>\n <tr>\n <th>4</th>\n <td>9.0</td>\n <td>276</td>\n <td>91</td>\n <td>40.6</td>\n </tr>\n <tr>\n <th>5</th>\n <td>7.9</td>\n <td>204</td>\n <td>78</td>\n <td>38.7</td>\n </tr>\n <tr>\n <th>6</th>\n <td>3.3</td>\n <td>110</td>\n <td>77</td>\n <td>11.1</td>\n </tr>\n <tr>\n <th>7</th>\n <td>5.9</td>\n <td>238</td>\n <td>72</td>\n <td>15.8</td>\n </tr>\n <tr>\n <th>8</th>\n <td>15.4</td>\n <td>335</td>\n <td>80</td>\n <td>31.9</td>\n </tr>\n <tr>\n <th>9</th>\n <td>17.4</td>\n <td>211</td>\n <td>60</td>\n <td>25.8</td>\n </tr>\n <tr>\n <th>10</th>\n <td>5.3</td>\n <td>46</td>\n <td>83</td>\n <td>20.2</td>\n </tr>\n <tr>\n <th>11</th>\n <td>2.6</td>\n <td>120</td>\n <td>54</td>\n <td>14.2</td>\n </tr>\n <tr>\n <th>12</th>\n <td>10.4</td>\n <td>249</td>\n <td>83</td>\n <td>24.0</td>\n </tr>\n <tr>\n <th>13</th>\n <td>7.2</td>\n <td>113</td>\n <td>65</td>\n <td>21.0</td>\n </tr>\n <tr>\n <th>14</th>\n <td>2.2</td>\n <td>56</td>\n <td>57</td>\n <td>11.3</td>\n </tr>\n <tr>\n <th>15</th>\n <td>6.0</td>\n <td>115</td>\n <td>66</td>\n <td>18.0</td>\n </tr>\n <tr>\n <th>16</th>\n <td>9.7</td>\n <td>109</td>\n 
<td>52</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>17</th>\n <td>15.4</td>\n <td>249</td>\n <td>66</td>\n <td>22.2</td>\n </tr>\n <tr>\n <th>18</th>\n <td>2.1</td>\n <td>83</td>\n <td>51</td>\n <td>7.8</td>\n </tr>\n <tr>\n <th>19</th>\n <td>11.3</td>\n <td>300</td>\n <td>67</td>\n <td>27.8</td>\n </tr>\n <tr>\n <th>20</th>\n <td>4.4</td>\n <td>149</td>\n <td>85</td>\n <td>16.3</td>\n </tr>\n <tr>\n <th>21</th>\n <td>12.1</td>\n <td>255</td>\n <td>74</td>\n <td>35.1</td>\n </tr>\n <tr>\n <th>22</th>\n <td>2.7</td>\n <td>72</td>\n <td>66</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>23</th>\n <td>16.1</td>\n <td>259</td>\n <td>44</td>\n <td>17.1</td>\n </tr>\n <tr>\n <th>24</th>\n <td>9.0</td>\n <td>178</td>\n <td>70</td>\n <td>28.2</td>\n </tr>\n <tr>\n <th>25</th>\n <td>6.0</td>\n <td>109</td>\n <td>53</td>\n <td>16.4</td>\n </tr>\n <tr>\n <th>26</th>\n <td>4.3</td>\n <td>102</td>\n <td>62</td>\n <td>16.5</td>\n </tr>\n <tr>\n <th>27</th>\n <td>12.2</td>\n <td>252</td>\n <td>81</td>\n <td>46.0</td>\n </tr>\n <tr>\n <th>28</th>\n <td>2.1</td>\n <td>57</td>\n <td>56</td>\n <td>9.5</td>\n </tr>\n <tr>\n <th>29</th>\n <td>7.4</td>\n <td>159</td>\n <td>89</td>\n <td>18.8</td>\n </tr>\n <tr>\n <th>30</th>\n <td>11.4</td>\n <td>285</td>\n <td>70</td>\n <td>32.1</td>\n </tr>\n <tr>\n <th>31</th>\n <td>11.1</td>\n <td>254</td>\n <td>86</td>\n <td>26.1</td>\n </tr>\n <tr>\n <th>32</th>\n <td>13.0</td>\n <td>337</td>\n <td>45</td>\n <td>16.1</td>\n </tr>\n <tr>\n <th>33</th>\n <td>0.8</td>\n <td>45</td>\n <td>44</td>\n <td>7.3</td>\n </tr>\n <tr>\n <th>34</th>\n <td>7.3</td>\n <td>120</td>\n <td>75</td>\n <td>21.4</td>\n </tr>\n <tr>\n <th>35</th>\n <td>6.6</td>\n <td>151</td>\n <td>68</td>\n <td>20.0</td>\n </tr>\n <tr>\n <th>36</th>\n <td>4.9</td>\n <td>159</td>\n <td>67</td>\n <td>29.3</td>\n </tr>\n <tr>\n <th>37</th>\n <td>6.3</td>\n <td>106</td>\n <td>72</td>\n <td>14.9</td>\n </tr>\n <tr>\n <th>38</th>\n <td>3.4</td>\n <td>174</td>\n <td>87</td>\n <td>8.3</td>\n </tr>\n 
<tr>\n <th>39</th>\n <td>14.4</td>\n <td>279</td>\n <td>48</td>\n <td>22.5</td>\n </tr>\n <tr>\n <th>40</th>\n <td>3.8</td>\n <td>86</td>\n <td>45</td>\n <td>12.8</td>\n </tr>\n <tr>\n <th>41</th>\n <td>13.2</td>\n <td>188</td>\n <td>59</td>\n <td>26.9</td>\n </tr>\n <tr>\n <th>42</th>\n <td>12.7</td>\n <td>201</td>\n <td>80</td>\n <td>25.5</td>\n </tr>\n <tr>\n <th>43</th>\n <td>3.2</td>\n <td>120</td>\n <td>80</td>\n <td>22.9</td>\n </tr>\n <tr>\n <th>44</th>\n <td>2.2</td>\n <td>48</td>\n <td>32</td>\n <td>11.2</td>\n </tr>\n <tr>\n <th>45</th>\n <td>8.5</td>\n <td>156</td>\n <td>63</td>\n <td>20.7</td>\n </tr>\n <tr>\n <th>46</th>\n <td>4.0</td>\n <td>145</td>\n <td>73</td>\n <td>26.2</td>\n </tr>\n <tr>\n <th>47</th>\n <td>5.7</td>\n <td>81</td>\n <td>39</td>\n <td>9.3</td>\n </tr>\n <tr>\n <th>48</th>\n <td>2.6</td>\n <td>53</td>\n <td>66</td>\n <td>10.8</td>\n </tr>\n <tr>\n <th>49</th>\n <td>6.8</td>\n <td>161</td>\n <td>60</td>\n <td>15.6</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-b0ff6977-0c28-4cc6-a93f-bc0488b0e950')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: 
#E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-b0ff6977-0c28-4cc6-a93f-bc0488b0e950 button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-b0ff6977-0c28-4cc6-a93f-bc0488b0e950');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Murder Assault UrbanPop Rape\n0 13.2 236 58 21.2\n1 10.0 263 48 44.5\n2 8.1 294 80 31.0\n3 8.8 190 50 19.5\n4 9.0 276 91 40.6\n5 7.9 204 78 38.7\n6 3.3 110 77 11.1\n7 5.9 238 72 15.8\n8 15.4 335 80 31.9\n9 17.4 211 60 25.8\n10 5.3 46 83 20.2\n11 2.6 120 54 14.2\n12 10.4 249 83 24.0\n13 7.2 113 65 21.0\n14 2.2 56 57 11.3\n15 6.0 115 66 18.0\n16 9.7 109 52 16.3\n17 15.4 249 66 22.2\n18 2.1 83 51 7.8\n19 11.3 300 67 27.8\n20 4.4 149 85 16.3\n21 12.1 255 74 35.1\n22 2.7 72 66 14.9\n23 16.1 259 44 17.1\n24 9.0 178 70 28.2\n25 6.0 109 53 16.4\n26 4.3 102 62 16.5\n27 12.2 252 81 46.0\n28 2.1 57 56 9.5\n29 7.4 159 89 18.8\n30 11.4 285 70 32.1\n31 11.1 254 86 26.1\n32 13.0 337 45 16.1\n33 0.8 45 44 7.3\n34 7.3 120 75 21.4\n35 6.6 151 68 20.0\n36 4.9 159 67 29.3\n37 6.3 106 72 14.9\n38 3.4 174 87 8.3\n39 14.4 279 48 22.5\n40 3.8 86 45 12.8\n41 13.2 188 59 26.9\n42 12.7 201 80 25.5\n43 3.2 120 80 22.9\n44 2.2 48 32 11.2\n45 8.5 156 63 20.7\n46 4.0 145 73 26.2\n47 5.7 81 39 9.3\n48 2.6 53 66 10.8\n49 6.8 161 60 15.6"
},
"execution_count": 42,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "tLze3K89eHc8",
"outputId": "52c24132-d545-4341-fc9b-82752f975089",
"trusted": false
},
"cell_type": "code",
"source": "array = scan1.values \narray ",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "array([[ 13.2, 236. , 58. , 21.2],\n [ 10. , 263. , 48. , 44.5],\n [ 8.1, 294. , 80. , 31. ],\n [ 8.8, 190. , 50. , 19.5],\n [ 9. , 276. , 91. , 40.6],\n [ 7.9, 204. , 78. , 38.7],\n [ 3.3, 110. , 77. , 11.1],\n [ 5.9, 238. , 72. , 15.8],\n [ 15.4, 335. , 80. , 31.9],\n [ 17.4, 211. , 60. , 25.8],\n [ 5.3, 46. , 83. , 20.2],\n [ 2.6, 120. , 54. , 14.2],\n [ 10.4, 249. , 83. , 24. ],\n [ 7.2, 113. , 65. , 21. ],\n [ 2.2, 56. , 57. , 11.3],\n [ 6. , 115. , 66. , 18. ],\n [ 9.7, 109. , 52. , 16.3],\n [ 15.4, 249. , 66. , 22.2],\n [ 2.1, 83. , 51. , 7.8],\n [ 11.3, 300. , 67. , 27.8],\n [ 4.4, 149. , 85. , 16.3],\n [ 12.1, 255. , 74. , 35.1],\n [ 2.7, 72. , 66. , 14.9],\n [ 16.1, 259. , 44. , 17.1],\n [ 9. , 178. , 70. , 28.2],\n [ 6. , 109. , 53. , 16.4],\n [ 4.3, 102. , 62. , 16.5],\n [ 12.2, 252. , 81. , 46. ],\n [ 2.1, 57. , 56. , 9.5],\n [ 7.4, 159. , 89. , 18.8],\n [ 11.4, 285. , 70. , 32.1],\n [ 11.1, 254. , 86. , 26.1],\n [ 13. , 337. , 45. , 16.1],\n [ 0.8, 45. , 44. , 7.3],\n [ 7.3, 120. , 75. , 21.4],\n [ 6.6, 151. , 68. , 20. ],\n [ 4.9, 159. , 67. , 29.3],\n [ 6.3, 106. , 72. , 14.9],\n [ 3.4, 174. , 87. , 8.3],\n [ 14.4, 279. , 48. , 22.5],\n [ 3.8, 86. , 45. , 12.8],\n [ 13.2, 188. , 59. , 26.9],\n [ 12.7, 201. , 80. , 25.5],\n [ 3.2, 120. , 80. , 22.9],\n [ 2.2, 48. , 32. , 11.2],\n [ 8.5, 156. , 63. , 20.7],\n [ 4. , 145. , 73. , 26.2],\n [ 5.7, 81. , 39. , 9.3],\n [ 2.6, 53. , 66. , 10.8],\n [ 6.8, 161. , 60. , 15.6]])"
},
"execution_count": 43,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "te34uXBseRnU",
"outputId": "f3b254bf-b0f9-4798-b650-f0d6a51c53fc",
"trusted": false
},
"cell_type": "code",
"source": "stdscal = StandardScaler().fit(array)\nx = stdscal.transform(array)\nx",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "array([[ 1.25517927, 0.79078716, -0.52619514, -0.00345116],\n [ 0.51301858, 1.11805959, -1.22406668, 2.50942392],\n [ 0.07236067, 1.49381682, 1.00912225, 1.05346626],\n [ 0.23470832, 0.23321191, -1.08449238, -0.18679398],\n [ 0.28109336, 1.2756352 , 1.77678094, 2.08881393],\n [ 0.02597562, 0.40290872, 0.86954794, 1.88390137],\n [-1.04088037, -0.73648418, 0.79976079, -1.09272319],\n [-0.43787481, 0.81502956, 0.45082502, -0.58583422],\n [ 1.76541475, 1.99078607, 1.00912225, 1.1505301 ],\n [ 2.22926518, 0.48775713, -0.38662083, 0.49265293],\n [-0.57702994, -1.51224105, 1.21848371, -0.11129987],\n [-1.20322802, -0.61527217, -0.80534376, -0.75839217],\n [ 0.60578867, 0.94836277, 1.21848371, 0.29852525],\n [-0.13637203, -0.70012057, -0.03768506, -0.0250209 ],\n [-1.29599811, -1.39102904, -0.5959823 , -1.07115345],\n [-0.41468229, -0.67587817, 0.03210209, -0.34856705],\n [ 0.44344101, -0.74860538, -0.94491807, -0.53190987],\n [ 1.76541475, 0.94836277, 0.03210209, 0.10439756],\n [-1.31919063, -1.06375661, -1.01470522, -1.44862395],\n [ 0.81452136, 1.56654403, 0.10188925, 0.70835037],\n [-0.78576263, -0.26375734, 1.35805802, -0.53190987],\n [ 1.00006153, 1.02108998, 0.59039932, 1.49564599],\n [-1.1800355 , -1.19708982, 0.03210209, -0.68289807],\n [ 1.9277624 , 1.06957478, -1.5032153 , -0.44563089],\n [ 0.28109336, 0.0877575 , 0.31125071, 0.75148985],\n [-0.41468229, -0.74860538, -0.87513091, -0.521125 ],\n [-0.80895515, -0.83345379, -0.24704653, -0.51034012],\n [ 1.02325405, 0.98472638, 1.0789094 , 2.671197 ],\n [-1.31919063, -1.37890783, -0.66576945, -1.26528114],\n [-0.08998698, -0.14254532, 1.63720664, -0.26228808],\n [ 0.83771388, 1.38472601, 0.31125071, 1.17209984],\n [ 0.76813632, 1.00896878, 1.42784517, 0.52500755],\n [ 1.20879423, 2.01502847, -1.43342815, -0.55347961],\n [-1.62069341, -1.52436225, -1.5032153 , -1.50254831],\n [-0.11317951, -0.61527217, 0.66018648, 0.01811858],\n [-0.27552716, -0.23951493, 0.1716764 , -0.13286962],\n [-0.66980002, 
-0.14254532, 0.10188925, 0.87012344],\n [-0.34510472, -0.78496898, 0.45082502, -0.68289807],\n [-1.01768785, 0.03927269, 1.49763233, -1.39469959],\n [ 1.53348953, 1.3119988 , -1.22406668, 0.13675217],\n [-0.92491776, -1.027393 , -1.43342815, -0.90938037],\n [ 1.25517927, 0.20896951, -0.45640799, 0.61128652],\n [ 1.13921666, 0.36654512, 1.00912225, 0.46029832],\n [-1.06407289, -0.61527217, 1.00912225, 0.17989166],\n [-1.29599811, -1.48799864, -2.34066115, -1.08193832],\n [ 0.16513075, -0.17890893, -0.17725937, -0.05737552],\n [-0.87853272, -0.31224214, 0.52061217, 0.53579242],\n [-0.48425985, -1.08799901, -1.85215107, -1.28685088],\n [-1.20322802, -1.42739264, 0.03210209, -1.1250778 ],\n [-0.22914211, -0.11830292, -0.38662083, -0.60740397]])"
},
"execution_count": 45,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 282
},
"id": "V4FIKtCFex3b",
"outputId": "60379584-cec2-4c46-e64e-5afad57d8967",
"trusted": false
},
"cell_type": "code",
"source": "from sklearn.neighbors import NearestNeighbors\nneigh = NearestNeighbors(n_neighbors=8) #2n = 2*No of columns \nnbrs = neigh.fit(x)\ndistances , indices = nbrs.kneighbors(x)\ndistances = np.sort(distances, axis=0)\ndistances = distances[:,1]\nplt.plot(distances) ",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "[<matplotlib.lines.Line2D at 0x7f3fba81b2d0>]"
},
"execution_count": 48,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": "<Figure size 432x288 with 1 Axes>"
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "ytr8tqkLgsTO",
"outputId": "8442af08-f90e-42fa-9014-14e996488df1",
"trusted": false
},
"cell_type": "code",
"source": "dbscan = DBSCAN(eps=1.25, min_samples=5)\ndbscan.fit(x)\ndbscan.labels_ ",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "array([ 0, -1, 1, 2, -1, 1, 2, 2, -1, 0, 2, 2, 1, 2, 2, 2, 2,\n 0, 2, 1, 2, 1, 2, -1, 2, 2, 2, -1, 2, 2, 1, 1, -1, 2,\n 2, 2, 2, 2, 2, 0, 2, 0, 2, 2, 2, 2, 2, 2, 2, 2])"
},
"execution_count": 58,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "TqcR7hJeh_wJ",
"outputId": "ba519157-22c7-4e32-e83c-d551026476e4",
"trusted": false
},
"cell_type": "code",
"source": "cl=pd.DataFrame(dbscan.labels_,columns=['cluster']) \npd.set_option(\"display.max_rows\", None) \ncl",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-7ba4a237-b2e7-43a1-93f7-8615b94b8983\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>cluster</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>0</td>\n </tr>\n <tr>\n <th>1</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>2</th>\n <td>1</td>\n </tr>\n <tr>\n <th>3</th>\n <td>2</td>\n </tr>\n <tr>\n <th>4</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>5</th>\n <td>1</td>\n </tr>\n <tr>\n <th>6</th>\n <td>2</td>\n </tr>\n <tr>\n <th>7</th>\n <td>2</td>\n </tr>\n <tr>\n <th>8</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>9</th>\n <td>0</td>\n </tr>\n <tr>\n <th>10</th>\n <td>2</td>\n </tr>\n <tr>\n <th>11</th>\n <td>2</td>\n </tr>\n <tr>\n <th>12</th>\n <td>1</td>\n </tr>\n <tr>\n <th>13</th>\n <td>2</td>\n </tr>\n <tr>\n <th>14</th>\n <td>2</td>\n </tr>\n <tr>\n <th>15</th>\n <td>2</td>\n </tr>\n <tr>\n <th>16</th>\n <td>2</td>\n </tr>\n <tr>\n <th>17</th>\n <td>0</td>\n </tr>\n <tr>\n <th>18</th>\n <td>2</td>\n </tr>\n <tr>\n <th>19</th>\n <td>1</td>\n </tr>\n <tr>\n <th>20</th>\n <td>2</td>\n </tr>\n <tr>\n <th>21</th>\n <td>1</td>\n </tr>\n <tr>\n <th>22</th>\n <td>2</td>\n </tr>\n <tr>\n <th>23</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>24</th>\n <td>2</td>\n </tr>\n <tr>\n <th>25</th>\n <td>2</td>\n </tr>\n <tr>\n <th>26</th>\n <td>2</td>\n </tr>\n <tr>\n <th>27</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>28</th>\n <td>2</td>\n </tr>\n <tr>\n <th>29</th>\n <td>2</td>\n </tr>\n <tr>\n <th>30</th>\n <td>1</td>\n </tr>\n <tr>\n <th>31</th>\n <td>1</td>\n </tr>\n <tr>\n <th>32</th>\n <td>-1</td>\n </tr>\n <tr>\n <th>33</th>\n <td>2</td>\n </tr>\n <tr>\n <th>34</th>\n <td>2</td>\n </tr>\n <tr>\n <th>35</th>\n <td>2</td>\n </tr>\n <tr>\n <th>36</th>\n 
<td>2</td>\n </tr>\n <tr>\n <th>37</th>\n <td>2</td>\n </tr>\n <tr>\n <th>38</th>\n <td>2</td>\n </tr>\n <tr>\n <th>39</th>\n <td>0</td>\n </tr>\n <tr>\n <th>40</th>\n <td>2</td>\n </tr>\n <tr>\n <th>41</th>\n <td>0</td>\n </tr>\n <tr>\n <th>42</th>\n <td>2</td>\n </tr>\n <tr>\n <th>43</th>\n <td>2</td>\n </tr>\n <tr>\n <th>44</th>\n <td>2</td>\n </tr>\n <tr>\n <th>45</th>\n <td>2</td>\n </tr>\n <tr>\n <th>46</th>\n <td>2</td>\n </tr>\n <tr>\n <th>47</th>\n <td>2</td>\n </tr>\n <tr>\n <th>48</th>\n <td>2</td>\n </tr>\n <tr>\n <th>49</th>\n <td>2</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-7ba4a237-b2e7-43a1-93f7-8615b94b8983')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n 
[theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-7ba4a237-b2e7-43a1-93f7-8615b94b8983 button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-7ba4a237-b2e7-43a1-93f7-8615b94b8983');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " cluster\n0 0\n1 -1\n2 1\n3 2\n4 -1\n5 1\n6 2\n7 2\n8 -1\n9 0\n10 2\n11 2\n12 1\n13 2\n14 2\n15 2\n16 2\n17 0\n18 2\n19 1\n20 2\n21 1\n22 2\n23 -1\n24 2\n25 2\n26 2\n27 -1\n28 2\n29 2\n30 1\n31 1\n32 -1\n33 2\n34 2\n35 2\n36 2\n37 2\n38 2\n39 0\n40 2\n41 0\n42 2\n43 2\n44 2\n45 2\n46 2\n47 2\n48 2\n49 2"
},
"execution_count": 52,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 206
},
"id": "8YKn1JLAiJWl",
"outputId": "354fa645-e117-49ed-91ea-963c10fb97f9",
"trusted": false
},
"cell_type": "code",
"source": "scan2= pd.concat([scan,cl],axis=1) \nscan2.head() ",
"execution_count": null,
"outputs": [
{
"data": {
"text/html": "\n <div id=\"df-efcfa550-d771-472e-8fd5-4e47547df23e\">\n <div class=\"colab-df-container\">\n <div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Unnamed: 0</th>\n <th>Murder</th>\n <th>Assault</th>\n <th>UrbanPop</th>\n <th>Rape</th>\n <th>cluster</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>Alabama</td>\n <td>13.2</td>\n <td>236</td>\n <td>58</td>\n <td>21.2</td>\n <td>0</td>\n </tr>\n <tr>\n <th>1</th>\n <td>Alaska</td>\n <td>10.0</td>\n <td>263</td>\n <td>48</td>\n <td>44.5</td>\n <td>-1</td>\n </tr>\n <tr>\n <th>2</th>\n <td>Arizona</td>\n <td>8.1</td>\n <td>294</td>\n <td>80</td>\n <td>31.0</td>\n <td>1</td>\n </tr>\n <tr>\n <th>3</th>\n <td>Arkansas</td>\n <td>8.8</td>\n <td>190</td>\n <td>50</td>\n <td>19.5</td>\n <td>2</td>\n </tr>\n <tr>\n <th>4</th>\n <td>California</td>\n <td>9.0</td>\n <td>276</td>\n <td>91</td>\n <td>40.6</td>\n <td>-1</td>\n </tr>\n </tbody>\n</table>\n</div>\n <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-efcfa550-d771-472e-8fd5-4e47547df23e')\"\n title=\"Convert this dataframe to an interactive table.\"\n style=\"display:none;\">\n \n <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n width=\"24px\">\n <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 
18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n </svg>\n </button>\n \n <style>\n .colab-df-container {\n display:flex;\n flex-wrap:wrap;\n gap: 12px;\n }\n\n .colab-df-convert {\n background-color: #E8F0FE;\n border: none;\n border-radius: 50%;\n cursor: pointer;\n display: none;\n fill: #1967D2;\n height: 32px;\n padding: 0 0 0 0;\n width: 32px;\n }\n\n .colab-df-convert:hover {\n background-color: #E2EBFA;\n box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n fill: #174EA6;\n }\n\n [theme=dark] .colab-df-convert {\n background-color: #3B4455;\n fill: #D2E3FC;\n }\n\n [theme=dark] .colab-df-convert:hover {\n background-color: #434B5C;\n box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n fill: #FFFFFF;\n }\n </style>\n\n <script>\n const buttonEl =\n document.querySelector('#df-efcfa550-d771-472e-8fd5-4e47547df23e button.colab-df-convert');\n buttonEl.style.display =\n google.colab.kernel.accessAllowed ? 'block' : 'none';\n\n async function convertToInteractive(key) {\n const element = document.querySelector('#df-efcfa550-d771-472e-8fd5-4e47547df23e');\n const dataTable =\n await google.colab.kernel.invokeFunction('convertToInteractive',\n [key], {});\n if (!dataTable) return;\n\n const docLinkHtml = 'Like what you see? Visit the ' +\n '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n + ' to learn more about interactive tables.';\n element.innerHTML = '';\n dataTable['output_type'] = 'display_data';\n await google.colab.output.renderOutput(dataTable, element);\n const docLink = document.createElement('div');\n docLink.innerHTML = docLinkHtml;\n element.appendChild(docLink);\n }\n </script>\n </div>\n </div>\n ",
"text/plain": " Unnamed: 0 Murder Assault UrbanPop Rape cluster\n0 Alabama 13.2 236 58 21.2 0\n1 Alaska 10.0 263 48 44.5 -1\n2 Arizona 8.1 294 80 31.0 1\n3 Arkansas 8.8 190 50 19.5 2\n4 California 9.0 276 91 40.6 -1"
},
"execution_count": 53,
"metadata": {},
"output_type": "execute_result"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 287
},
"id": "ZthAicAwiY2f",
"outputId": "e671d694-e116-41ae-f282-f8aff05ede57",
"trusted": false
},
"cell_type": "code",
"source": "scan2.plot(x =\"Assault\",y =\"Rape\",c=dbscan.labels_ ,kind=\"scatter\",s=50 ,cmap=plt.cm.copper_r) \nplt.title('Clusters using DBScan') ",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "Text(0.5, 1.0, 'Clusters using DBScan')"
},
"execution_count": 54,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": "<Figure size 432x288 with 2 Axes>"
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
]
},
{
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "SFdItfOeinda",
"outputId": "7977f2c9-0f95-4028-9bd3-e36a723e1447",
"trusted": false
},
"cell_type": "code",
"source": "dl = dbscan.labels_ \nimport sklearn\nsklearn.metrics.silhouette_score(x, dl) ",
"execution_count": null,
"outputs": [
{
"data": {
"text/plain": "0.23869670053300915"
},
"execution_count": 55,
"metadata": {},
"output_type": "execute_result"
}
]
}
],
"metadata": {
"colab": {
"provenance": []
},
"kernelspec": {
"name": "python3",
"display_name": "Python 3 (ipykernel)",
"language": "python"
},
"language_info": {
"name": "python",
"version": "3.9.13",
"mimetype": "text/x-python",
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"pygments_lexer": "ipython3",
"nbconvert_exporter": "python",
"file_extension": ".py"
},
"gist": {
"id": "",
"data": {
"description": "!excelR/assignments/Gists/crime_data_clustering_assgn.ipynb",
"public": true
}
}
},
"nbformat": 4,
"nbformat_minor": 1
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment