diff --git a/data/website.csv b/your-code/data/website.csv old mode 100755 new mode 100644 similarity index 100% rename from data/website.csv rename to your-code/data/website.csv diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a5caf8b..8a59812 100755 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -21,7 +21,8 @@ "%matplotlib inline\n", "\n", "import numpy as np\n", - "import pandas as pd" + "import pandas as pd\n", + "import pyforest" ] }, { @@ -41,7 +42,7 @@ "metadata": {}, "outputs": [], "source": [ - "websites = pd.read_csv('../data/website.csv')" + "websites = pd.read_csv('./data/website.csv')" ] }, { @@ -67,18 +68,279 @@ "cell_type": "code", "execution_count": 3, "metadata": {}, - "outputs": [], - "source": [ - "# Your code here\n" + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "CONTENT_LENGTH | \n", + "WHOIS_COUNTRY | \n", + "WHOIS_STATEPRO | \n", + "WHOIS_REGDATE | \n", + "WHOIS_UPDATED_DATE | \n", + "... | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "16 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "263.0 | \n", + "None | \n", + "None | \n", + "10/10/2015 18:21 | \n", + "None | \n", + "... | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "9 | \n", + "10 | \n", + "1153 | \n", + "832 | \n", + "9 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "16 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "15087.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "17 | \n", + "19 | \n", + "1265 | \n", + "1230 | \n", + "17 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "16 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "324.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "162.0 | \n", + "US | \n", + "AK | \n", + "7/10/1997 4:00 | \n", + "12/09/2013 0:45 | \n", + "... | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "17 | \n", + "6 | \n", + "UTF-8 | \n", + "None | \n", + "124140.0 | \n", + "US | \n", + "TX | \n", + "12/05/1996 0:00 | \n", + "11/04/2017 0:00 | \n", + "... | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "61 | \n", + "62 | \n", + "129889 | \n", + "4586 | \n", + "61 | \n", + "4.0 | \n", + "0 | \n", + "
5 rows × 21 columns
\n", + "LogisticRegression()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LogisticRegression()
KNeighborsClassifier(n_neighbors=3)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier(n_neighbors=3)
KNeighborsClassifier()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier()