From 7d91a84b42d1f6e8660d4d1e6fc260ca48bf5bc3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E2=80=9Cdanielmdepaoli=E2=80=9D?= <“danielmdepaoli@gmail.com”> Date: Sat, 26 Aug 2023 13:10:47 +0100 Subject: [PATCH] Lab Done --- your-code/main.ipynb | 1247 ++++++++++++++++++++++++++++++++++++++---- 1 file changed, 1134 insertions(+), 113 deletions(-) diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a5caf8b..482ec74 100755 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -37,13 +37,236 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 19, "metadata": {}, "outputs": [], "source": [ "websites = pd.read_csv('../data/website.csv')" ] }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "CONTENT_LENGTH | \n", + "WHOIS_COUNTRY | \n", + "WHOIS_STATEPRO | \n", + "WHOIS_REGDATE | \n", + "WHOIS_UPDATED_DATE | \n", + "... | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "16 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "263.0 | \n", + "None | \n", + "None | \n", + "10/10/2015 18:21 | \n", + "None | \n", + "... | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "9 | \n", + "10 | \n", + "1153 | \n", + "832 | \n", + "9 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "16 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "15087.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "17 | \n", + "19 | \n", + "1265 | \n", + "1230 | \n", + "17 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "16 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "324.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "162.0 | \n", + "US | \n", + "AK | \n", + "7/10/1997 4:00 | \n", + "12/09/2013 0:45 | \n", + "... | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "17 | \n", + "6 | \n", + "UTF-8 | \n", + "None | \n", + "124140.0 | \n", + "US | \n", + "TX | \n", + "12/05/1996 0:00 | \n", + "11/04/2017 0:00 | \n", + "... | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "61 | \n", + "62 | \n", + "129889 | \n", + "4586 | \n", + "61 | \n", + "4.0 | \n", + "0 | \n", + "
5 rows × 21 columns
\n", + "| \n", + " | URL_LENGTH | \n", + "TCP_CONVERSATION_EXCHANGE | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "CHARSET_ISO-8859 | \n", + "... | \n", + "WHOIS_COUNTRY_AU | \n", + "WHOIS_COUNTRY_CA | \n", + "WHOIS_COUNTRY_ES | \n", + "WHOIS_COUNTRY_IN | \n", + "WHOIS_COUNTRY_JP | \n", + "WHOIS_COUNTRY_None | \n", + "WHOIS_COUNTRY_OTHER | \n", + "WHOIS_COUNTRY_PA | \n", + "WHOIS_COUNTRY_UK | \n", + "WHOIS_COUNTRY_US | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "16 | \n", + "7 | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "1153 | \n", + "832 | \n", + "2.0 | \n", + "1 | \n", + "0 | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 1 | \n", + "16 | \n", + "17 | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "1265 | \n", + "1230 | \n", + "0.0 | \n", + "0 | \n", + "0 | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 2 | \n", + "16 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "0 | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "17 | \n", + "31 | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "18784 | \n", + "4380 | \n", + "8.0 | \n", + "0 | \n", + "0 | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 4 | \n", + "17 | \n", + "57 | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "129889 | \n", + "4586 | \n", + "4.0 | \n", + "0 | \n", + "0 | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
5 rows × 32 columns
\n", + "LogisticRegression()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LogisticRegression()
KNeighborsClassifier(n_neighbors=3)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier(n_neighbors=3)
KNeighborsClassifier()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier()