diff --git a/.ipynb_checkpoints/Answers_2018-01-18-checkpoint.ipynb b/.ipynb_checkpoints/Answers_2018-01-18-checkpoint.ipynb new file mode 100644 index 0000000..9d2e72b --- /dev/null +++ b/.ipynb_checkpoints/Answers_2018-01-18-checkpoint.ipynb @@ -0,0 +1,1025 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from sklearn.linear_model import LogisticRegression\n", + "from sklearn.metrics import confusion_matrix\n", + "from sklearn.model_selection import train_test_split\n", + "from sklearn.model_selection import cross_val_score\n", + "from pandas.plotting import scatter_matrix\n", + "from itertools import combinations\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0 | \n", + "380 | \n", + "3.61 | \n", + "3 | \n", + "
| 1 | \n", + "1 | \n", + "660 | \n", + "3.67 | \n", + "3 | \n", + "
| 2 | \n", + "1 | \n", + "800 | \n", + "4.00 | \n", + "1 | \n", + "
| 3 | \n", + "1 | \n", + "640 | \n", + "3.19 | \n", + "4 | \n", + "
| 4 | \n", + "0 | \n", + "520 | \n", + "2.93 | \n", + "4 | \n", + "
| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "
|---|---|---|---|---|
| count | \n", + "400.000000 | \n", + "400.000000 | \n", + "400.000000 | \n", + "400.00000 | \n", + "
| mean | \n", + "0.317500 | \n", + "587.700000 | \n", + "3.389900 | \n", + "2.48500 | \n", + "
| std | \n", + "0.466087 | \n", + "115.516536 | \n", + "0.380567 | \n", + "0.94446 | \n", + "
| min | \n", + "0.000000 | \n", + "220.000000 | \n", + "2.260000 | \n", + "1.00000 | \n", + "
| 25% | \n", + "0.000000 | \n", + "520.000000 | \n", + "3.130000 | \n", + "2.00000 | \n", + "
| 50% | \n", + "0.000000 | \n", + "580.000000 | \n", + "3.395000 | \n", + "2.00000 | \n", + "
| 75% | \n", + "1.000000 | \n", + "660.000000 | \n", + "3.670000 | \n", + "3.00000 | \n", + "
| max | \n", + "1.000000 | \n", + "800.000000 | \n", + "4.000000 | \n", + "4.00000 | \n", + "
| rank | \n", + "1 | \n", + "2 | \n", + "3 | \n", + "4 | \n", + "
|---|---|---|---|---|
| admit | \n", + "\n", + " | \n", + " | \n", + " | \n", + " |
| 0 | \n", + "28 | \n", + "97 | \n", + "93 | \n", + "55 | \n", + "
| 1 | \n", + "33 | \n", + "54 | \n", + "28 | \n", + "12 | \n", + "
| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "rank1 | \n", + "rank2 | \n", + "rank3 | \n", + "rank4 | \n", + "
|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "0 | \n", + "380 | \n", + "3.61 | \n", + "3 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "
| 1 | \n", + "1 | \n", + "660 | \n", + "3.67 | \n", + "3 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "
| 2 | \n", + "1 | \n", + "800 | \n", + "4.00 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "1 | \n", + "640 | \n", + "3.19 | \n", + "4 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 4 | \n", + "0 | \n", + "520 | \n", + "2.93 | \n", + "4 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| \n", + " | Accuracy | \n", + "Columns | \n", + "
|---|---|---|
| 0 | \n", + "0.682570 | \n", + "(gre,) | \n", + "
| 1 | \n", + "0.682570 | \n", + "(gpa,) | \n", + "
| 2 | \n", + "0.684817 | \n", + "(rank1,) | \n", + "
| 3 | \n", + "0.682570 | \n", + "(rank2,) | \n", + "
| 4 | \n", + "0.682570 | \n", + "(rank3,) | \n", + "
| 5 | \n", + "0.682570 | \n", + "(rank4,) | \n", + "
| 6 | \n", + "0.682570 | \n", + "(gre, gpa) | \n", + "
| 7 | \n", + "0.689759 | \n", + "(gre, rank1) | \n", + "
| 8 | \n", + "0.682570 | \n", + "(gre, rank2) | \n", + "
| 9 | \n", + "0.674878 | \n", + "(gre, rank3) | \n", + "
| 10 | \n", + "0.682570 | \n", + "(gre, rank4) | \n", + "
| 11 | \n", + "0.714576 | \n", + "(gpa, rank1) | \n", + "
| 12 | \n", + "0.682570 | \n", + "(gpa, rank2) | \n", + "
| 13 | \n", + "0.682570 | \n", + "(gpa, rank3) | \n", + "
| 14 | \n", + "0.682570 | \n", + "(gpa, rank4) | \n", + "
| 15 | \n", + "0.670000 | \n", + "(rank1, rank2) | \n", + "
| 16 | \n", + "0.684817 | \n", + "(rank1, rank3) | \n", + "
| 17 | \n", + "0.684817 | \n", + "(rank1, rank4) | \n", + "
| 18 | \n", + "0.682570 | \n", + "(rank2, rank3) | \n", + "
| 19 | \n", + "0.682570 | \n", + "(rank2, rank4) | \n", + "
| 20 | \n", + "0.682570 | \n", + "(rank3, rank4) | \n", + "
| 21 | \n", + "0.687320 | \n", + "(gre, gpa, rank1) | \n", + "
| 22 | \n", + "0.682570 | \n", + "(gre, gpa, rank2) | \n", + "
| 23 | \n", + "0.680006 | \n", + "(gre, gpa, rank3) | \n", + "
| 24 | \n", + "0.680006 | \n", + "(gre, gpa, rank4) | \n", + "
| 25 | \n", + "0.687259 | \n", + "(gre, rank1, rank2) | \n", + "
| 26 | \n", + "0.689759 | \n", + "(gre, rank1, rank3) | \n", + "
| 27 | \n", + "0.689759 | \n", + "(gre, rank1, rank4) | \n", + "
| 28 | \n", + "0.677567 | \n", + "(gre, rank2, rank3) | \n", + "
| 29 | \n", + "0.682570 | \n", + "(gre, rank2, rank4) | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "
| 32 | \n", + "0.714576 | \n", + "(gpa, rank1, rank3) | \n", + "
| 33 | \n", + "0.712137 | \n", + "(gpa, rank1, rank4) | \n", + "
| 34 | \n", + "0.682570 | \n", + "(gpa, rank2, rank3) | \n", + "
| 35 | \n", + "0.682570 | \n", + "(gpa, rank2, rank4) | \n", + "
| 36 | \n", + "0.682570 | \n", + "(gpa, rank3, rank4) | \n", + "
| 37 | \n", + "0.670000 | \n", + "(rank1, rank2, rank3) | \n", + "
| 38 | \n", + "0.670000 | \n", + "(rank1, rank2, rank4) | \n", + "
| 39 | \n", + "0.684817 | \n", + "(rank1, rank3, rank4) | \n", + "
| 40 | \n", + "0.659994 | \n", + "(rank2, rank3, rank4) | \n", + "
| 41 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank2) | \n", + "
| 42 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank3) | \n", + "
| 43 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank4) | \n", + "
| 44 | \n", + "0.677567 | \n", + "(gre, gpa, rank2, rank3) | \n", + "
| 45 | \n", + "0.682570 | \n", + "(gre, gpa, rank2, rank4) | \n", + "
| 46 | \n", + "0.677631 | \n", + "(gre, gpa, rank3, rank4) | \n", + "
| 47 | \n", + "0.689759 | \n", + "(gre, rank1, rank2, rank3) | \n", + "
| 48 | \n", + "0.689759 | \n", + "(gre, rank1, rank2, rank4) | \n", + "
| 49 | \n", + "0.692259 | \n", + "(gre, rank1, rank3, rank4) | \n", + "
| 50 | \n", + "0.687259 | \n", + "(gre, rank2, rank3, rank4) | \n", + "
| 51 | \n", + "0.707076 | \n", + "(gpa, rank1, rank2, rank3) | \n", + "
| 52 | \n", + "0.712076 | \n", + "(gpa, rank1, rank2, rank4) | \n", + "
| 53 | \n", + "0.712137 | \n", + "(gpa, rank1, rank3, rank4) | \n", + "
| 54 | \n", + "0.714640 | \n", + "(gpa, rank2, rank3, rank4) | \n", + "
| 55 | \n", + "0.684817 | \n", + "(rank1, rank2, rank3, rank4) | \n", + "
| 56 | \n", + "0.687259 | \n", + "(gre, gpa, rank1, rank2, rank3) | \n", + "
| 57 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank2, rank4) | \n", + "
| 58 | \n", + "0.702262 | \n", + "(gre, gpa, rank1, rank3, rank4) | \n", + "
| 59 | \n", + "0.699701 | \n", + "(gre, gpa, rank2, rank3, rank4) | \n", + "
| 60 | \n", + "0.687259 | \n", + "(gre, rank1, rank2, rank3, rank4) | \n", + "
| 61 | \n", + "0.712137 | \n", + "(gpa, rank1, rank2, rank3, rank4) | \n", + "
62 rows × 2 columns
\n", + "| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0 | \n", + "380 | \n", + "3.61 | \n", + "3 | \n", + "
| 1 | \n", + "1 | \n", + "660 | \n", + "3.67 | \n", + "3 | \n", + "
| 2 | \n", + "1 | \n", + "800 | \n", + "4.00 | \n", + "1 | \n", + "
| 3 | \n", + "1 | \n", + "640 | \n", + "3.19 | \n", + "4 | \n", + "
| 4 | \n", + "0 | \n", + "520 | \n", + "2.93 | \n", + "4 | \n", + "
| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "
|---|---|---|---|---|
| count | \n", + "400.000000 | \n", + "400.000000 | \n", + "400.000000 | \n", + "400.00000 | \n", + "
| mean | \n", + "0.317500 | \n", + "587.700000 | \n", + "3.389900 | \n", + "2.48500 | \n", + "
| std | \n", + "0.466087 | \n", + "115.516536 | \n", + "0.380567 | \n", + "0.94446 | \n", + "
| min | \n", + "0.000000 | \n", + "220.000000 | \n", + "2.260000 | \n", + "1.00000 | \n", + "
| 25% | \n", + "0.000000 | \n", + "520.000000 | \n", + "3.130000 | \n", + "2.00000 | \n", + "
| 50% | \n", + "0.000000 | \n", + "580.000000 | \n", + "3.395000 | \n", + "2.00000 | \n", + "
| 75% | \n", + "1.000000 | \n", + "660.000000 | \n", + "3.670000 | \n", + "3.00000 | \n", + "
| max | \n", + "1.000000 | \n", + "800.000000 | \n", + "4.000000 | \n", + "4.00000 | \n", + "
| rank | \n", + "1 | \n", + "2 | \n", + "3 | \n", + "4 | \n", + "
|---|---|---|---|---|
| admit | \n", + "\n", + " | \n", + " | \n", + " | \n", + " |
| 0 | \n", + "28 | \n", + "97 | \n", + "93 | \n", + "55 | \n", + "
| 1 | \n", + "33 | \n", + "54 | \n", + "28 | \n", + "12 | \n", + "
| \n", + " | admit | \n", + "gre | \n", + "gpa | \n", + "rank | \n", + "rank1 | \n", + "rank2 | \n", + "rank3 | \n", + "rank4 | \n", + "
|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "0 | \n", + "380 | \n", + "3.61 | \n", + "3 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "
| 1 | \n", + "1 | \n", + "660 | \n", + "3.67 | \n", + "3 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "
| 2 | \n", + "1 | \n", + "800 | \n", + "4.00 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "1 | \n", + "640 | \n", + "3.19 | \n", + "4 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| 4 | \n", + "0 | \n", + "520 | \n", + "2.93 | \n", + "4 | \n", + "0 | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "
| \n", + " | Accuracy | \n", + "Columns | \n", + "
|---|---|---|
| 0 | \n", + "0.682570 | \n", + "(gre,) | \n", + "
| 1 | \n", + "0.682570 | \n", + "(gpa,) | \n", + "
| 2 | \n", + "0.684817 | \n", + "(rank1,) | \n", + "
| 3 | \n", + "0.682570 | \n", + "(rank2,) | \n", + "
| 4 | \n", + "0.682570 | \n", + "(rank3,) | \n", + "
| 5 | \n", + "0.682570 | \n", + "(rank4,) | \n", + "
| 6 | \n", + "0.682570 | \n", + "(gre, gpa) | \n", + "
| 7 | \n", + "0.689759 | \n", + "(gre, rank1) | \n", + "
| 8 | \n", + "0.682570 | \n", + "(gre, rank2) | \n", + "
| 9 | \n", + "0.674878 | \n", + "(gre, rank3) | \n", + "
| 10 | \n", + "0.682570 | \n", + "(gre, rank4) | \n", + "
| 11 | \n", + "0.714576 | \n", + "(gpa, rank1) | \n", + "
| 12 | \n", + "0.682570 | \n", + "(gpa, rank2) | \n", + "
| 13 | \n", + "0.682570 | \n", + "(gpa, rank3) | \n", + "
| 14 | \n", + "0.682570 | \n", + "(gpa, rank4) | \n", + "
| 15 | \n", + "0.670000 | \n", + "(rank1, rank2) | \n", + "
| 16 | \n", + "0.684817 | \n", + "(rank1, rank3) | \n", + "
| 17 | \n", + "0.684817 | \n", + "(rank1, rank4) | \n", + "
| 18 | \n", + "0.682570 | \n", + "(rank2, rank3) | \n", + "
| 19 | \n", + "0.682570 | \n", + "(rank2, rank4) | \n", + "
| 20 | \n", + "0.682570 | \n", + "(rank3, rank4) | \n", + "
| 21 | \n", + "0.687320 | \n", + "(gre, gpa, rank1) | \n", + "
| 22 | \n", + "0.682570 | \n", + "(gre, gpa, rank2) | \n", + "
| 23 | \n", + "0.680006 | \n", + "(gre, gpa, rank3) | \n", + "
| 24 | \n", + "0.680006 | \n", + "(gre, gpa, rank4) | \n", + "
| 25 | \n", + "0.687259 | \n", + "(gre, rank1, rank2) | \n", + "
| 26 | \n", + "0.689759 | \n", + "(gre, rank1, rank3) | \n", + "
| 27 | \n", + "0.689759 | \n", + "(gre, rank1, rank4) | \n", + "
| 28 | \n", + "0.677567 | \n", + "(gre, rank2, rank3) | \n", + "
| 29 | \n", + "0.682570 | \n", + "(gre, rank2, rank4) | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "
| 32 | \n", + "0.714576 | \n", + "(gpa, rank1, rank3) | \n", + "
| 33 | \n", + "0.712137 | \n", + "(gpa, rank1, rank4) | \n", + "
| 34 | \n", + "0.682570 | \n", + "(gpa, rank2, rank3) | \n", + "
| 35 | \n", + "0.682570 | \n", + "(gpa, rank2, rank4) | \n", + "
| 36 | \n", + "0.682570 | \n", + "(gpa, rank3, rank4) | \n", + "
| 37 | \n", + "0.670000 | \n", + "(rank1, rank2, rank3) | \n", + "
| 38 | \n", + "0.670000 | \n", + "(rank1, rank2, rank4) | \n", + "
| 39 | \n", + "0.684817 | \n", + "(rank1, rank3, rank4) | \n", + "
| 40 | \n", + "0.659994 | \n", + "(rank2, rank3, rank4) | \n", + "
| 41 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank2) | \n", + "
| 42 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank3) | \n", + "
| 43 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank4) | \n", + "
| 44 | \n", + "0.677567 | \n", + "(gre, gpa, rank2, rank3) | \n", + "
| 45 | \n", + "0.682570 | \n", + "(gre, gpa, rank2, rank4) | \n", + "
| 46 | \n", + "0.677631 | \n", + "(gre, gpa, rank3, rank4) | \n", + "
| 47 | \n", + "0.689759 | \n", + "(gre, rank1, rank2, rank3) | \n", + "
| 48 | \n", + "0.689759 | \n", + "(gre, rank1, rank2, rank4) | \n", + "
| 49 | \n", + "0.692259 | \n", + "(gre, rank1, rank3, rank4) | \n", + "
| 50 | \n", + "0.687259 | \n", + "(gre, rank2, rank3, rank4) | \n", + "
| 51 | \n", + "0.707076 | \n", + "(gpa, rank1, rank2, rank3) | \n", + "
| 52 | \n", + "0.712076 | \n", + "(gpa, rank1, rank2, rank4) | \n", + "
| 53 | \n", + "0.712137 | \n", + "(gpa, rank1, rank3, rank4) | \n", + "
| 54 | \n", + "0.714640 | \n", + "(gpa, rank2, rank3, rank4) | \n", + "
| 55 | \n", + "0.684817 | \n", + "(rank1, rank2, rank3, rank4) | \n", + "
| 56 | \n", + "0.687259 | \n", + "(gre, gpa, rank1, rank2, rank3) | \n", + "
| 57 | \n", + "0.692259 | \n", + "(gre, gpa, rank1, rank2, rank4) | \n", + "
| 58 | \n", + "0.702262 | \n", + "(gre, gpa, rank1, rank3, rank4) | \n", + "
| 59 | \n", + "0.699701 | \n", + "(gre, gpa, rank2, rank3, rank4) | \n", + "
| 60 | \n", + "0.687259 | \n", + "(gre, rank1, rank2, rank3, rank4) | \n", + "
| 61 | \n", + "0.712137 | \n", + "(gpa, rank1, rank2, rank3, rank4) | \n", + "
62 rows × 2 columns
\n", + "