diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a5caf8b..f926324 100755 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -21,7 +21,8 @@ "%matplotlib inline\n", "\n", "import numpy as np\n", - "import pandas as pd" + "import pandas as pd\n", + "import matplotlib.pyplot as plt" ] }, { @@ -67,18 +68,267 @@ "cell_type": "code", "execution_count": 3, "metadata": {}, - "outputs": [], - "source": [ - "# Your code here\n" + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | URL | \n", + "URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "CONTENT_LENGTH | \n", + "WHOIS_COUNTRY | \n", + "WHOIS_STATEPRO | \n", + "WHOIS_REGDATE | \n", + "WHOIS_UPDATED_DATE | \n", + "... | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "16 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "263.0 | \n", + "None | \n", + "None | \n", + "10/10/2015 18:21 | \n", + "None | \n", + "... | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "9 | \n", + "10 | \n", + "1153 | \n", + "832 | \n", + "9 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "16 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "15087.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "17 | \n", + "19 | \n", + "1265 | \n", + "1230 | \n", + "17 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "16 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "324.0 | \n", + "None | \n", + "None | \n", + "None | \n", + "None | \n", + "... | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "17 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "162.0 | \n", + "US | \n", + "AK | \n", + "7/10/1997 4:00 | \n", + "12/09/2013 0:45 | \n", + "... | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "39 | \n", + "37 | \n", + "18784 | \n", + "4380 | \n", + "39 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "17 | \n", + "6 | \n", + "UTF-8 | \n", + "None | \n", + "124140.0 | \n", + "US | \n", + "TX | \n", + "12/05/1996 0:00 | \n", + "11/04/2017 0:00 | \n", + "... | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "61 | \n", + "62 | \n", + "129889 | \n", + "4586 | \n", + "61 | \n", + "4.0 | \n", + "0 | \n", + "
5 rows × 21 columns
\n", + "| \n", + " | URL_LENGTH | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CONTENT_LENGTH | \n", + "TCP_CONVERSATION_EXCHANGE | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_PACKETS | \n", + "REMOTE_APP_PACKETS | \n", + "SOURCE_APP_BYTES | \n", + "REMOTE_APP_BYTES | \n", + "APP_PACKETS | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| URL_LENGTH | \n", + "1.000000 | \n", + "0.917986 | \n", + "0.129745 | \n", + "-0.038407 | \n", + "-0.039839 | \n", + "-0.046367 | \n", + "-0.026446 | \n", + "-0.042264 | \n", + "-0.033779 | \n", + "-0.014857 | \n", + "-0.026686 | \n", + "-0.042264 | \n", + "-0.068582 | \n", + "0.162104 | \n", + "
| NUMBER_SPECIAL_CHARACTERS | \n", + "0.917986 | \n", + "1.000000 | \n", + "0.214225 | \n", + "-0.037459 | \n", + "-0.042619 | \n", + "-0.047103 | \n", + "-0.023914 | \n", + "-0.040096 | \n", + "-0.030597 | \n", + "-0.014376 | \n", + "-0.024098 | \n", + "-0.040096 | \n", + "-0.050048 | \n", + "0.280897 | \n", + "
| CONTENT_LENGTH | \n", + "0.129745 | \n", + "0.214225 | \n", + "1.000000 | \n", + "0.078451 | \n", + "-0.000381 | \n", + "0.004774 | \n", + "0.051202 | \n", + "0.074142 | \n", + "0.091077 | \n", + "0.100094 | \n", + "0.047595 | \n", + "0.074142 | \n", + "-0.045644 | \n", + "-0.090852 | \n", + "
| TCP_CONVERSATION_EXCHANGE | \n", + "-0.038407 | \n", + "-0.037459 | \n", + "0.078451 | \n", + "1.000000 | \n", + "0.555188 | \n", + "0.331080 | \n", + "0.457320 | \n", + "0.997796 | \n", + "0.990848 | \n", + "0.865580 | \n", + "0.458702 | \n", + "0.997796 | \n", + "0.349832 | \n", + "-0.040202 | \n", + "
| DIST_REMOTE_TCP_PORT | \n", + "-0.039839 | \n", + "-0.042619 | \n", + "-0.000381 | \n", + "0.555188 | \n", + "1.000000 | \n", + "0.210188 | \n", + "0.780238 | \n", + "0.558612 | \n", + "0.591188 | \n", + "0.313359 | \n", + "0.781212 | \n", + "0.558612 | \n", + "0.259942 | \n", + "-0.082925 | \n", + "
| REMOTE_IPS | \n", + "-0.046367 | \n", + "-0.047103 | \n", + "0.004774 | \n", + "0.331080 | \n", + "0.210188 | \n", + "1.000000 | \n", + "0.023126 | \n", + "0.361104 | \n", + "0.304683 | \n", + "0.171651 | \n", + "0.025324 | \n", + "0.361104 | \n", + "0.548189 | \n", + "-0.078783 | \n", + "
| APP_BYTES | \n", + "-0.026446 | \n", + "-0.023914 | \n", + "0.051202 | \n", + "0.457320 | \n", + "0.780238 | \n", + "0.023126 | \n", + "1.000000 | \n", + "0.445822 | \n", + "0.468999 | \n", + "0.074464 | \n", + "0.999992 | \n", + "0.445822 | \n", + "0.012221 | \n", + "-0.011262 | \n", + "
| SOURCE_APP_PACKETS | \n", + "-0.042264 | \n", + "-0.040096 | \n", + "0.074142 | \n", + "0.997796 | \n", + "0.558612 | \n", + "0.361104 | \n", + "0.445822 | \n", + "1.000000 | \n", + "0.989285 | \n", + "0.857495 | \n", + "0.447448 | \n", + "1.000000 | \n", + "0.410843 | \n", + "-0.034414 | \n", + "
| REMOTE_APP_PACKETS | \n", + "-0.033779 | \n", + "-0.030597 | \n", + "0.091077 | \n", + "0.990848 | \n", + "0.591188 | \n", + "0.304683 | \n", + "0.468999 | \n", + "0.989285 | \n", + "1.000000 | \n", + "0.880555 | \n", + "0.470401 | \n", + "0.989285 | \n", + "0.355716 | \n", + "-0.032897 | \n", + "
| SOURCE_APP_BYTES | \n", + "-0.014857 | \n", + "-0.014376 | \n", + "0.100094 | \n", + "0.865580 | \n", + "0.313359 | \n", + "0.171651 | \n", + "0.074464 | \n", + "0.857495 | \n", + "0.880555 | \n", + "1.000000 | \n", + "0.075328 | \n", + "0.857495 | \n", + "0.215285 | \n", + "-0.043852 | \n", + "
| REMOTE_APP_BYTES | \n", + "-0.026686 | \n", + "-0.024098 | \n", + "0.047595 | \n", + "0.458702 | \n", + "0.781212 | \n", + "0.025324 | \n", + "0.999992 | \n", + "0.447448 | \n", + "0.470401 | \n", + "0.075328 | \n", + "1.000000 | \n", + "0.447448 | \n", + "0.016215 | \n", + "-0.011004 | \n", + "
| APP_PACKETS | \n", + "-0.042264 | \n", + "-0.040096 | \n", + "0.074142 | \n", + "0.997796 | \n", + "0.558612 | \n", + "0.361104 | \n", + "0.445822 | \n", + "1.000000 | \n", + "0.989285 | \n", + "0.857495 | \n", + "0.447448 | \n", + "1.000000 | \n", + "0.410843 | \n", + "-0.034414 | \n", + "
| DNS_QUERY_TIMES | \n", + "-0.068582 | \n", + "-0.050048 | \n", + "-0.045644 | \n", + "0.349832 | \n", + "0.259942 | \n", + "0.548189 | \n", + "0.012221 | \n", + "0.410843 | \n", + "0.355716 | \n", + "0.215285 | \n", + "0.016215 | \n", + "0.410843 | \n", + "1.000000 | \n", + "0.068753 | \n", + "
| Type | \n", + "0.162104 | \n", + "0.280897 | \n", + "-0.090852 | \n", + "-0.040202 | \n", + "-0.082925 | \n", + "-0.078783 | \n", + "-0.011262 | \n", + "-0.034414 | \n", + "-0.032897 | \n", + "-0.043852 | \n", + "-0.011004 | \n", + "-0.034414 | \n", + "0.068753 | \n", + "1.000000 | \n", + "
| \n", + " | URL | \n", + "NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "WHOIS_COUNTRY | \n", + "TCP_CONVERSATION_EXCHANGE | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_BYTES | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "M0_109 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "OTHER | \n", + "7 | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "1153 | \n", + "2.0 | \n", + "1 | \n", + "
| 1 | \n", + "B0_2314 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache/2.4.10 | \n", + "OTHER | \n", + "17 | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "1265 | \n", + "0.0 | \n", + "0 | \n", + "
| 2 | \n", + "B0_911 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft-HTTPAPI/2.0 | \n", + "OTHER | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "
| 3 | \n", + "B0_113 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "US | \n", + "31 | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "18784 | \n", + "8.0 | \n", + "0 | \n", + "
| 4 | \n", + "B0_403 | \n", + "6 | \n", + "UTF-8 | \n", + "None | \n", + "US | \n", + "57 | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "129889 | \n", + "4.0 | \n", + "0 | \n", + "
| \n", + " | NUMBER_SPECIAL_CHARACTERS | \n", + "CHARSET | \n", + "SERVER | \n", + "WHOIS_COUNTRY | \n", + "TCP_CONVERSATION_EXCHANGE | \n", + "DIST_REMOTE_TCP_PORT | \n", + "REMOTE_IPS | \n", + "APP_BYTES | \n", + "SOURCE_APP_BYTES | \n", + "DNS_QUERY_TIMES | \n", + "Type | \n", + "Apache | \n", + "Microsoft | \n", + "Other | \n", + "nginx | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "7 | \n", + "iso-8859-1 | \n", + "nginx | \n", + "OTHER | \n", + "7 | \n", + "0 | \n", + "2 | \n", + "700 | \n", + "1153 | \n", + "2.0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 1 | \n", + "6 | \n", + "UTF-8 | \n", + "Apache | \n", + "OTHER | \n", + "17 | \n", + "7 | \n", + "4 | \n", + "1230 | \n", + "1265 | \n", + "0.0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 2 | \n", + "6 | \n", + "us-ascii | \n", + "Microsoft | \n", + "OTHER | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "6 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "US | \n", + "31 | \n", + "22 | \n", + "3 | \n", + "3812 | \n", + "18784 | \n", + "8.0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 4 | \n", + "6 | \n", + "UTF-8 | \n", + "Other | \n", + "US | \n", + "57 | \n", + "2 | \n", + "5 | \n", + "4278 | \n", + "129889 | \n", + "4.0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 1776 | \n", + "16 | \n", + "UTF-8 | \n", + "Apache | \n", + "ES | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "186 | \n", + "0.0 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 1777 | \n", + "17 | \n", + "UTF-8 | \n", + "Apache | \n", + "ES | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "124 | \n", + "0.0 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 1778 | \n", + "34 | \n", + "utf-8 | \n", + "Apache | \n", + "US | \n", + "83 | \n", + "2 | \n", + "6 | \n", + "6631 | \n", + "132181 | \n", + "4.0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 1779 | \n", + "34 | \n", + "ISO-8859-1 | \n", + "nginx | \n", + "US | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0.0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 1780 | \n", + "40 | \n", + "utf-8 | \n", + "Microsoft | \n", + "US | \n", + "19 | \n", + "6 | \n", + "11 | \n", + "2314 | \n", + "3039 | \n", + "6.0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "
1779 rows × 15 columns
\n", + "LogisticRegression()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LogisticRegression()
KNeighborsClassifier(n_neighbors=3)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
KNeighborsClassifier(n_neighbors=3)