diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a5caf8b..c7aa3af 100755 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -20,8 +20,11 @@ "\n", "%matplotlib inline\n", "\n", + "\n", "import numpy as np\n", - "import pandas as pd" + "import pandas as pd\n", + "import seaborn as sns\n", + "import matplotlib.pyplot as plt" ] }, { @@ -65,11 +68,289 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "CONTENT_LENGTH | \n", + "WHOIS_COUNTRY | \n", + "WHOIS_STATEPRO | \n", + "WHOIS_REGDATE | \n", + "WHOIS_UPDATED_DATE | \n", + "... | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "16 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "263.0 | \n", + "NaN | \n", + "NaN | \n", + "10/10/2015 18:21 | \n", + "NaN | \n", + "... | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "9 | \n", + "10 | \n", + "1153 | \n", + "832 | \n", + "9 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "16 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "15087.0 | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "... | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "17 | \n", + "19 | \n", + "1265 | \n", + "1230 | \n", + "17 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "16 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "324.0 | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "162.0 | \n", + "US | \n", + "AK | \n", + "7/10/1997 4:00 | \n", + "12/09/2013 0:45 | \n", + "... | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "17 | \n", + "6 | \n", + "UTF-8 | \n", + "NaN | \n", + "124140.0 | \n", + "US | \n", + "TX | \n", + "12/05/1996 0:00 | \n", + "11/04/2017 0:00 | \n", + "... | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "61 | \n", + "62 | \n", + "129889 | \n", + "4586 | \n", + "61 | \n", + "4.0 | \n", + "0 | \n", + "
5 rows × 21 columns
\n", + "| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "CONTENT_LENGTH | \n", + "WHOIS_COUNTRY | \n", + "WHOIS_STATEPRO | \n", + "WHOIS_REGDATE | \n", + "WHOIS_UPDATED_DATE | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "16 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "263.0 | \n", + "NaN | \n", + "NaN | \n", + "10/10/2015 18:21 | \n", + "NaN | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "9 | \n", + "10 | \n", + "1153 | \n", + "832 | \n", + "9 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "16 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "15087.0 | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "17 | \n", + "19 | \n", + "1265 | \n", + "1230 | \n", + "17 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "16 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "324.0 | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "162.0 | \n", + "US | \n", + "AK | \n", + "7/10/1997 4:00 | \n", + "12/09/2013 0:45 | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "17 | \n", + "6 | \n", + "UTF-8 | \n", + "NaN | \n", + "124140.0 | \n", + "US | \n", + "TX | \n", + "12/05/1996 0:00 | \n", + "11/04/2017 0:00 | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "61 | \n", + "62 | \n", + "129889 | \n", + "4586 | \n", + "61 | \n", + "4.0 | \n", + "0 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 1776 | \n", + "M4_48 | \n", + "194 | \n", + "16 | \n", + "UTF-8 | \n", + "Apache | \n", + "NaN | \n", + "ES | \n", + "Barcelona | \n", + "17/09/2008 0:00 | \n", + "2/09/2016 0:00 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "3 | \n", + "186 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "1 | \n", + "
| 1777 | \n", + "M4_41 | \n", + "198 | \n", + "17 | \n", + "UTF-8 | \n", + "Apache | \n", + "NaN | \n", + "ES | \n", + "Barcelona | \n", + "17/09/2008 0:00 | \n", + "2/09/2016 0:00 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "2 | \n", + "124 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "1 | \n", + "
| 1778 | \n", + "B0_162 | \n", + "201 | \n", + "34 | \n", + "utf-8 | \n", + "Apache/2.2.16 (Debian) | \n", + "8904.0 | \n", + "US | \n", + "FL | \n", + "15/02/1999 0:00 | \n", + "15/07/2015 0:00 | \n", + "2 | \n", + "6 | \n", + "6631 | \n", + "87 | \n", + "89 | \n", + "132181 | \n", + "6945 | \n", + "87 | \n", + "4.0 | \n", + "0 | \n", + "
| 1779 | \n", + "B0_1152 | \n", + "234 | \n", + "34 | \n", + "ISO-8859-1 | \n", + "cloudflare-nginx | \n", + "NaN | \n", + "US | \n", + "CA | \n", + "1/04/1998 0:00 | \n", + "9/12/2016 0:00 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 1780 | \n", + "B0_676 | \n", + "249 | \n", + "40 | \n", + "utf-8 | \n", + "Microsoft-IIS/8.5 | \n", + "24435.0 | \n", + "US | \n", + "Wisconsin | \n", + "14/11/2008 0:00 | \n", + "20/11/2013 0:00 | \n", + "6 | \n", + "11 | \n", + "2314 | \n", + "25 | \n", + "28 | \n", + "3039 | \n", + "2776 | \n", + "25 | \n", + "6.0 | \n", + "0 | \n", + "
1781 rows × 20 columns
\n", + "| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "WHOIS_COUNTRY | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "US | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 5 | \n", + "B0_2064 | \n", + "18 | \n", + "7 | \n", + "UTF-8 | \n", + "nginx | \n", + "OTHER | \n", + "6 | \n", + "9 | \n", + "894 | \n", + "11 | \n", + "13 | \n", + "838 | \n", + "894 | \n", + "11 | \n", + "0.0 | \n", + "0 | \n", + "
LogisticRegression(random_state=42)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LogisticRegression(random_state=42)
KNeighborsClassifier(n_neighbors=3)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier(n_neighbors=3)