diff --git a/Day 1/Part 3 - Classification/Decision Tree Classification/decision_tree_classification.ipynb b/Day 1/Part 3 - Classification/Decision Tree Classification/decision_tree_classification.ipynb index f601db9..d223c36 100644 --- a/Day 1/Part 3 - Classification/Decision Tree Classification/decision_tree_classification.ipynb +++ b/Day 1/Part 3 - Classification/Decision Tree Classification/decision_tree_classification.ipynb @@ -1 +1,1589 @@ -{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"name":"decision_tree_classification.ipynb","provenance":[],"collapsed_sections":[],"toc_visible":true,"machine_shape":"hm","authorship_tag":"ABX9TyP02NrvZmmq4qjp5mwU3Mr2"},"kernelspec":{"name":"python3","display_name":"Python 3"}},"cells":[{"cell_type":"markdown","metadata":{"id":"0MRC0e0KhQ0S","colab_type":"text"},"source":["# Decision Tree Classification"]},{"cell_type":"markdown","metadata":{"id":"LWd1UlMnhT2s","colab_type":"text"},"source":["## Importing the libraries"]},{"cell_type":"code","metadata":{"id":"YvGPUQaHhXfL","colab_type":"code","colab":{}},"source":["import numpy as np\n","import matplotlib.pyplot as plt\n","import pandas as pd"],"execution_count":0,"outputs":[]},{"cell_type":"markdown","metadata":{"id":"K1VMqkGvhc3-","colab_type":"text"},"source":["## Importing the dataset"]},{"cell_type":"code","metadata":{"id":"M52QDmyzhh9s","colab_type":"code","colab":{}},"source":["dataset = pd.read_csv('Social_Network_Ads.csv')\n","X = dataset.iloc[:, :-1].values\n","y = dataset.iloc[:, -1].values"],"execution_count":0,"outputs":[]},{"cell_type":"markdown","metadata":{"id":"YvxIPVyMhmKp","colab_type":"text"},"source":["## Splitting the dataset into the Training set and Test set"]},{"cell_type":"code","metadata":{"id":"AVzJWAXIhxoC","colab_type":"code","colab":{}},"source":["from sklearn.model_selection import train_test_split\n","X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.25, random_state = 
0)"],"execution_count":0,"outputs":[]},{"cell_type":"code","metadata":{"id":"P3nS3-6r1i2B","colab_type":"code","outputId":"fa90271e-3c0a-43c2-ba6c-cfce4819e98e","executionInfo":{"status":"ok","timestamp":1588269312367,"user_tz":-240,"elapsed":2065,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":1000}},"source":["print(X_train)"],"execution_count":4,"outputs":[{"output_type":"stream","text":["[[ 44 39000]\n"," [ 32 120000]\n"," [ 38 50000]\n"," [ 32 135000]\n"," [ 52 21000]\n"," [ 53 104000]\n"," [ 39 42000]\n"," [ 38 61000]\n"," [ 36 50000]\n"," [ 36 63000]\n"," [ 35 25000]\n"," [ 35 50000]\n"," [ 42 73000]\n"," [ 47 49000]\n"," [ 59 29000]\n"," [ 49 65000]\n"," [ 45 131000]\n"," [ 31 89000]\n"," [ 46 82000]\n"," [ 47 51000]\n"," [ 26 15000]\n"," [ 60 102000]\n"," [ 38 112000]\n"," [ 40 107000]\n"," [ 42 53000]\n"," [ 35 59000]\n"," [ 48 41000]\n"," [ 48 134000]\n"," [ 38 113000]\n"," [ 29 148000]\n"," [ 26 15000]\n"," [ 60 42000]\n"," [ 24 19000]\n"," [ 42 149000]\n"," [ 46 96000]\n"," [ 28 59000]\n"," [ 39 96000]\n"," [ 28 89000]\n"," [ 41 72000]\n"," [ 45 26000]\n"," [ 33 69000]\n"," [ 20 82000]\n"," [ 31 74000]\n"," [ 42 80000]\n"," [ 35 72000]\n"," [ 33 149000]\n"," [ 40 71000]\n"," [ 51 146000]\n"," [ 46 79000]\n"," [ 35 75000]\n"," [ 38 51000]\n"," [ 36 75000]\n"," [ 37 78000]\n"," [ 38 61000]\n"," [ 60 108000]\n"," [ 20 82000]\n"," [ 57 74000]\n"," [ 42 65000]\n"," [ 26 80000]\n"," [ 46 117000]\n"," [ 35 61000]\n"," [ 21 68000]\n"," [ 28 44000]\n"," [ 41 87000]\n"," [ 37 33000]\n"," [ 27 90000]\n"," [ 39 42000]\n"," [ 28 123000]\n"," [ 31 118000]\n"," [ 25 87000]\n"," [ 35 71000]\n"," [ 37 70000]\n"," [ 35 39000]\n"," [ 47 23000]\n"," [ 35 147000]\n"," [ 48 138000]\n"," [ 26 86000]\n"," [ 25 79000]\n"," [ 52 138000]\n"," [ 51 23000]\n"," [ 35 60000]\n"," [ 33 113000]\n"," [ 
30 107000]\n"," [ 48 33000]\n"," [ 41 80000]\n"," [ 48 96000]\n"," [ 31 18000]\n"," [ 31 71000]\n"," [ 43 129000]\n"," [ 59 76000]\n"," [ 18 44000]\n"," [ 36 118000]\n"," [ 42 90000]\n"," [ 47 30000]\n"," [ 26 43000]\n"," [ 40 78000]\n"," [ 46 59000]\n"," [ 59 42000]\n"," [ 46 74000]\n"," [ 35 91000]\n"," [ 28 59000]\n"," [ 40 57000]\n"," [ 59 143000]\n"," [ 57 26000]\n"," [ 52 38000]\n"," [ 47 113000]\n"," [ 53 143000]\n"," [ 35 27000]\n"," [ 58 101000]\n"," [ 45 45000]\n"," [ 23 82000]\n"," [ 46 23000]\n"," [ 42 65000]\n"," [ 28 84000]\n"," [ 38 59000]\n"," [ 26 84000]\n"," [ 29 28000]\n"," [ 37 71000]\n"," [ 22 55000]\n"," [ 48 35000]\n"," [ 49 28000]\n"," [ 38 65000]\n"," [ 27 17000]\n"," [ 46 28000]\n"," [ 48 141000]\n"," [ 26 17000]\n"," [ 35 97000]\n"," [ 39 59000]\n"," [ 24 27000]\n"," [ 32 18000]\n"," [ 46 88000]\n"," [ 35 58000]\n"," [ 56 60000]\n"," [ 47 34000]\n"," [ 40 72000]\n"," [ 32 100000]\n"," [ 19 21000]\n"," [ 25 90000]\n"," [ 35 88000]\n"," [ 28 32000]\n"," [ 50 20000]\n"," [ 40 59000]\n"," [ 50 44000]\n"," [ 35 72000]\n"," [ 40 142000]\n"," [ 46 32000]\n"," [ 39 71000]\n"," [ 20 74000]\n"," [ 29 75000]\n"," [ 31 76000]\n"," [ 47 25000]\n"," [ 40 61000]\n"," [ 34 112000]\n"," [ 38 80000]\n"," [ 42 75000]\n"," [ 47 47000]\n"," [ 39 75000]\n"," [ 19 25000]\n"," [ 37 80000]\n"," [ 36 60000]\n"," [ 41 52000]\n"," [ 36 125000]\n"," [ 48 29000]\n"," [ 36 126000]\n"," [ 51 134000]\n"," [ 27 57000]\n"," [ 38 71000]\n"," [ 39 61000]\n"," [ 22 27000]\n"," [ 33 60000]\n"," [ 48 74000]\n"," [ 58 23000]\n"," [ 53 72000]\n"," [ 32 117000]\n"," [ 54 70000]\n"," [ 30 80000]\n"," [ 58 95000]\n"," [ 26 52000]\n"," [ 45 79000]\n"," [ 24 55000]\n"," [ 40 75000]\n"," [ 33 28000]\n"," [ 44 139000]\n"," [ 22 18000]\n"," [ 33 51000]\n"," [ 43 133000]\n"," [ 24 32000]\n"," [ 46 22000]\n"," [ 35 55000]\n"," [ 54 104000]\n"," [ 48 119000]\n"," [ 35 53000]\n"," [ 37 144000]\n"," [ 23 66000]\n"," [ 37 137000]\n"," [ 31 58000]\n"," [ 33 41000]\n"," [ 45 22000]\n"," [ 30 
15000]\n"," [ 19 19000]\n"," [ 49 74000]\n"," [ 39 122000]\n"," [ 35 73000]\n"," [ 39 71000]\n"," [ 24 23000]\n"," [ 41 72000]\n"," [ 29 83000]\n"," [ 54 26000]\n"," [ 35 44000]\n"," [ 37 75000]\n"," [ 29 47000]\n"," [ 31 68000]\n"," [ 42 54000]\n"," [ 30 135000]\n"," [ 52 114000]\n"," [ 50 36000]\n"," [ 56 133000]\n"," [ 29 61000]\n"," [ 30 89000]\n"," [ 26 16000]\n"," [ 33 31000]\n"," [ 41 72000]\n"," [ 36 33000]\n"," [ 55 125000]\n"," [ 48 131000]\n"," [ 41 71000]\n"," [ 30 62000]\n"," [ 37 72000]\n"," [ 41 63000]\n"," [ 58 47000]\n"," [ 30 116000]\n"," [ 20 49000]\n"," [ 37 74000]\n"," [ 41 59000]\n"," [ 49 89000]\n"," [ 28 79000]\n"," [ 53 82000]\n"," [ 40 57000]\n"," [ 60 34000]\n"," [ 35 108000]\n"," [ 21 72000]\n"," [ 38 71000]\n"," [ 39 106000]\n"," [ 37 57000]\n"," [ 26 72000]\n"," [ 35 23000]\n"," [ 54 108000]\n"," [ 30 17000]\n"," [ 39 134000]\n"," [ 29 43000]\n"," [ 33 43000]\n"," [ 35 38000]\n"," [ 41 45000]\n"," [ 41 72000]\n"," [ 39 134000]\n"," [ 27 137000]\n"," [ 21 16000]\n"," [ 26 32000]\n"," [ 31 66000]\n"," [ 39 73000]\n"," [ 41 79000]\n"," [ 47 50000]\n"," [ 41 30000]\n"," [ 37 93000]\n"," [ 60 46000]\n"," [ 25 22000]\n"," [ 28 37000]\n"," [ 38 55000]\n"," [ 36 54000]\n"," [ 20 36000]\n"," [ 56 104000]\n"," [ 40 57000]\n"," [ 42 108000]\n"," [ 20 23000]\n"," [ 40 65000]\n"," [ 47 20000]\n"," [ 18 86000]\n"," [ 35 79000]\n"," [ 57 33000]\n"," [ 34 72000]\n"," [ 49 39000]\n"," [ 27 31000]\n"," [ 19 70000]\n"," [ 39 79000]\n"," [ 26 81000]\n"," [ 25 80000]\n"," [ 28 85000]\n"," [ 55 39000]\n"," [ 50 88000]\n"," [ 49 88000]\n"," [ 52 150000]\n"," [ 35 65000]\n"," [ 42 54000]\n"," [ 34 43000]\n"," [ 37 52000]\n"," [ 48 30000]\n"," [ 29 43000]\n"," [ 36 52000]\n"," [ 27 54000]\n"," [ 26 
118000]]\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"8dpDLojm1mVG","colab_type":"code","outputId":"4eaa18a3-6481-42bb-c409-7227565c7fe1","executionInfo":{"status":"ok","timestamp":1588269312368,"user_tz":-240,"elapsed":2059,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":171}},"source":["print(y_train)"],"execution_count":5,"outputs":[{"output_type":"stream","text":["[0 1 0 1 1 1 0 0 0 0 0 0 1 1 1 0 1 0 0 1 0 1 0 1 0 0 1 1 1 1 0 1 0 1 0 0 1\n"," 0 0 1 0 0 0 0 0 1 1 1 1 0 0 0 1 0 1 0 1 0 0 1 0 0 0 1 0 0 0 1 1 0 0 1 0 1\n"," 1 1 0 0 1 1 0 0 1 1 0 1 0 0 1 1 0 1 1 1 0 0 0 0 0 1 0 0 1 1 1 1 1 0 1 1 0\n"," 1 0 0 0 0 0 0 0 1 1 0 0 1 0 0 1 0 0 0 1 0 1 1 0 1 0 0 0 0 1 0 0 0 1 1 0 0\n"," 0 0 1 0 1 0 0 0 1 0 0 0 0 1 1 1 0 0 0 0 0 0 1 1 1 1 1 0 1 0 0 0 0 0 1 0 0\n"," 0 0 0 0 1 1 0 1 0 1 0 0 1 0 0 0 1 0 0 0 0 0 1 0 0 0 0 0 1 0 1 1 0 0 0 0 0\n"," 0 1 1 0 0 0 0 1 0 0 0 0 1 0 1 0 1 0 0 0 1 0 0 0 1 0 1 0 0 0 0 0 1 1 0 0 0\n"," 0 0 1 0 1 1 0 0 0 0 0 1 0 1 0 0 1 0 0 1 0 1 0 0 0 0 0 0 1 1 1 1 0 0 0 0 1\n"," 0 0 0 0]\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"qbb7i0DH1qui","colab_type":"code","outputId":"5c45ffab-4587-4828-8204-0f4fedf88980","executionInfo":{"status":"ok","timestamp":1588269312369,"user_tz":-240,"elapsed":2055,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":1000}},"source":["print(X_test)"],"execution_count":6,"outputs":[{"output_type":"stream","text":["[[ 30 87000]\n"," [ 38 50000]\n"," [ 35 75000]\n"," [ 30 79000]\n"," [ 35 50000]\n"," [ 27 20000]\n"," [ 31 15000]\n"," [ 36 144000]\n"," [ 18 68000]\n"," [ 47 43000]\n"," [ 30 49000]\n"," [ 28 55000]\n"," [ 37 
55000]\n"," [ 39 77000]\n"," [ 20 86000]\n"," [ 32 117000]\n"," [ 37 77000]\n"," [ 19 85000]\n"," [ 55 130000]\n"," [ 35 22000]\n"," [ 35 47000]\n"," [ 47 144000]\n"," [ 41 51000]\n"," [ 47 105000]\n"," [ 23 28000]\n"," [ 49 141000]\n"," [ 28 87000]\n"," [ 29 80000]\n"," [ 37 62000]\n"," [ 32 86000]\n"," [ 21 88000]\n"," [ 37 79000]\n"," [ 57 60000]\n"," [ 37 53000]\n"," [ 24 58000]\n"," [ 18 52000]\n"," [ 22 81000]\n"," [ 34 43000]\n"," [ 31 34000]\n"," [ 49 36000]\n"," [ 27 88000]\n"," [ 41 52000]\n"," [ 27 84000]\n"," [ 35 20000]\n"," [ 43 112000]\n"," [ 27 58000]\n"," [ 37 80000]\n"," [ 52 90000]\n"," [ 26 30000]\n"," [ 49 86000]\n"," [ 57 122000]\n"," [ 34 25000]\n"," [ 35 57000]\n"," [ 34 115000]\n"," [ 59 88000]\n"," [ 45 32000]\n"," [ 29 83000]\n"," [ 26 80000]\n"," [ 49 28000]\n"," [ 23 20000]\n"," [ 32 18000]\n"," [ 60 42000]\n"," [ 19 76000]\n"," [ 36 99000]\n"," [ 19 26000]\n"," [ 60 83000]\n"," [ 24 89000]\n"," [ 27 58000]\n"," [ 40 47000]\n"," [ 42 70000]\n"," [ 32 150000]\n"," [ 35 77000]\n"," [ 22 63000]\n"," [ 45 22000]\n"," [ 27 89000]\n"," [ 18 82000]\n"," [ 42 79000]\n"," [ 40 60000]\n"," [ 53 34000]\n"," [ 47 107000]\n"," [ 58 144000]\n"," [ 59 83000]\n"," [ 24 55000]\n"," [ 26 35000]\n"," [ 58 38000]\n"," [ 42 80000]\n"," [ 40 75000]\n"," [ 59 130000]\n"," [ 46 41000]\n"," [ 41 60000]\n"," [ 42 64000]\n"," [ 37 146000]\n"," [ 23 48000]\n"," [ 25 33000]\n"," [ 24 84000]\n"," [ 27 96000]\n"," [ 23 63000]\n"," [ 48 33000]\n"," [ 48 90000]\n"," [ 42 104000]]\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"kj1hnFAR1s5w","colab_type":"code","outputId":"984874ad-447c-441b-decb-3c775d9d7936","executionInfo":{"status":"ok","timestamp":1588269312369,"user_tz":-240,"elapsed":2051,"user":{"displayName":"Hadelin de 
Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":68}},"source":["print(y_test)"],"execution_count":7,"outputs":[{"output_type":"stream","text":["[0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 0 1 0 0 1 0 1 0 1 0 0 0 0 0 1 1 0 0 0 0\n"," 0 0 1 0 0 0 0 1 0 0 1 0 1 1 0 0 0 1 1 0 0 1 0 0 1 0 1 0 1 0 0 0 0 1 0 0 1\n"," 0 0 0 0 1 1 1 0 0 0 1 1 0 1 1 0 0 1 0 0 0 1 0 1 1 1]\n"],"name":"stdout"}]},{"cell_type":"markdown","metadata":{"id":"kW3c7UYih0hT","colab_type":"text"},"source":["## Feature Scaling"]},{"cell_type":"code","metadata":{"id":"9fQlDPKCh8sc","colab_type":"code","colab":{}},"source":["from sklearn.preprocessing import StandardScaler\n","sc = StandardScaler()\n","X_train = sc.fit_transform(X_train)\n","X_test = sc.transform(X_test)"],"execution_count":0,"outputs":[]},{"cell_type":"code","metadata":{"id":"syrnD1Op2BSR","colab_type":"code","outputId":"c71d71b1-d8b6-4391-dee4-6f8e48b848c2","executionInfo":{"status":"ok","timestamp":1588269312370,"user_tz":-240,"elapsed":2046,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":1000}},"source":["print(X_train)"],"execution_count":9,"outputs":[{"output_type":"stream","text":["[[ 0.58164944 -0.88670699]\n"," [-0.60673761 1.46173768]\n"," [-0.01254409 -0.5677824 ]\n"," [-0.60673761 1.89663484]\n"," [ 1.37390747 -1.40858358]\n"," [ 1.47293972 0.99784738]\n"," [ 0.08648817 -0.79972756]\n"," [-0.01254409 -0.24885782]\n"," [-0.21060859 -0.5677824 ]\n"," [-0.21060859 -0.19087153]\n"," [-0.30964085 -1.29261101]\n"," [-0.30964085 -0.5677824 ]\n"," [ 0.38358493 0.09905991]\n"," [ 0.8787462 -0.59677555]\n"," [ 2.06713324 -1.17663843]\n"," [ 1.07681071 -0.13288524]\n"," [ 0.68068169 1.78066227]\n"," [-0.70576986 
0.56295021]\n"," [ 0.77971394 0.35999821]\n"," [ 0.8787462 -0.53878926]\n"," [-1.20093113 -1.58254245]\n"," [ 2.1661655 0.93986109]\n"," [-0.01254409 1.22979253]\n"," [ 0.18552042 1.08482681]\n"," [ 0.38358493 -0.48080297]\n"," [-0.30964085 -0.30684411]\n"," [ 0.97777845 -0.8287207 ]\n"," [ 0.97777845 1.8676417 ]\n"," [-0.01254409 1.25878567]\n"," [-0.90383437 2.27354572]\n"," [-1.20093113 -1.58254245]\n"," [ 2.1661655 -0.79972756]\n"," [-1.39899564 -1.46656987]\n"," [ 0.38358493 2.30253886]\n"," [ 0.77971394 0.76590222]\n"," [-1.00286662 -0.30684411]\n"," [ 0.08648817 0.76590222]\n"," [-1.00286662 0.56295021]\n"," [ 0.28455268 0.07006676]\n"," [ 0.68068169 -1.26361786]\n"," [-0.50770535 -0.01691267]\n"," [-1.79512465 0.35999821]\n"," [-0.70576986 0.12805305]\n"," [ 0.38358493 0.30201192]\n"," [-0.30964085 0.07006676]\n"," [-0.50770535 2.30253886]\n"," [ 0.18552042 0.04107362]\n"," [ 1.27487521 2.21555943]\n"," [ 0.77971394 0.27301877]\n"," [-0.30964085 0.1570462 ]\n"," [-0.01254409 -0.53878926]\n"," [-0.21060859 0.1570462 ]\n"," [-0.11157634 0.24402563]\n"," [-0.01254409 -0.24885782]\n"," [ 2.1661655 1.11381995]\n"," [-1.79512465 0.35999821]\n"," [ 1.86906873 0.12805305]\n"," [ 0.38358493 -0.13288524]\n"," [-1.20093113 0.30201192]\n"," [ 0.77971394 1.37475825]\n"," [-0.30964085 -0.24885782]\n"," [-1.6960924 -0.04590581]\n"," [-1.00286662 -0.74174127]\n"," [ 0.28455268 0.50496393]\n"," [-0.11157634 -1.06066585]\n"," [-1.10189888 0.59194336]\n"," [ 0.08648817 -0.79972756]\n"," [-1.00286662 1.54871711]\n"," [-0.70576986 1.40375139]\n"," [-1.29996338 0.50496393]\n"," [-0.30964085 0.04107362]\n"," [-0.11157634 0.01208048]\n"," [-0.30964085 -0.88670699]\n"," [ 0.8787462 -1.3505973 ]\n"," [-0.30964085 2.24455257]\n"," [ 0.97777845 1.98361427]\n"," [-1.20093113 0.47597078]\n"," [-1.29996338 0.27301877]\n"," [ 1.37390747 1.98361427]\n"," [ 1.27487521 -1.3505973 ]\n"," [-0.30964085 -0.27785096]\n"," [-0.50770535 1.25878567]\n"," [-0.80480212 1.08482681]\n"," [ 0.97777845 
-1.06066585]\n"," [ 0.28455268 0.30201192]\n"," [ 0.97777845 0.76590222]\n"," [-0.70576986 -1.49556302]\n"," [-0.70576986 0.04107362]\n"," [ 0.48261718 1.72267598]\n"," [ 2.06713324 0.18603934]\n"," [-1.99318916 -0.74174127]\n"," [-0.21060859 1.40375139]\n"," [ 0.38358493 0.59194336]\n"," [ 0.8787462 -1.14764529]\n"," [-1.20093113 -0.77073441]\n"," [ 0.18552042 0.24402563]\n"," [ 0.77971394 -0.30684411]\n"," [ 2.06713324 -0.79972756]\n"," [ 0.77971394 0.12805305]\n"," [-0.30964085 0.6209365 ]\n"," [-1.00286662 -0.30684411]\n"," [ 0.18552042 -0.3648304 ]\n"," [ 2.06713324 2.12857999]\n"," [ 1.86906873 -1.26361786]\n"," [ 1.37390747 -0.91570013]\n"," [ 0.8787462 1.25878567]\n"," [ 1.47293972 2.12857999]\n"," [-0.30964085 -1.23462472]\n"," [ 1.96810099 0.91086794]\n"," [ 0.68068169 -0.71274813]\n"," [-1.49802789 0.35999821]\n"," [ 0.77971394 -1.3505973 ]\n"," [ 0.38358493 -0.13288524]\n"," [-1.00286662 0.41798449]\n"," [-0.01254409 -0.30684411]\n"," [-1.20093113 0.41798449]\n"," [-0.90383437 -1.20563157]\n"," [-0.11157634 0.04107362]\n"," [-1.59706014 -0.42281668]\n"," [ 0.97777845 -1.00267957]\n"," [ 1.07681071 -1.20563157]\n"," [-0.01254409 -0.13288524]\n"," [-1.10189888 -1.52455616]\n"," [ 0.77971394 -1.20563157]\n"," [ 0.97777845 2.07059371]\n"," [-1.20093113 -1.52455616]\n"," [-0.30964085 0.79489537]\n"," [ 0.08648817 -0.30684411]\n"," [-1.39899564 -1.23462472]\n"," [-0.60673761 -1.49556302]\n"," [ 0.77971394 0.53395707]\n"," [-0.30964085 -0.33583725]\n"," [ 1.77003648 -0.27785096]\n"," [ 0.8787462 -1.03167271]\n"," [ 0.18552042 0.07006676]\n"," [-0.60673761 0.8818748 ]\n"," [-1.89415691 -1.40858358]\n"," [-1.29996338 0.59194336]\n"," [-0.30964085 0.53395707]\n"," [-1.00286662 -1.089659 ]\n"," [ 1.17584296 -1.43757673]\n"," [ 0.18552042 -0.30684411]\n"," [ 1.17584296 -0.74174127]\n"," [-0.30964085 0.07006676]\n"," [ 0.18552042 2.09958685]\n"," [ 0.77971394 -1.089659 ]\n"," [ 0.08648817 0.04107362]\n"," [-1.79512465 0.12805305]\n"," [-0.90383437 0.1570462 ]\n"," 
[-0.70576986 0.18603934]\n"," [ 0.8787462 -1.29261101]\n"," [ 0.18552042 -0.24885782]\n"," [-0.4086731 1.22979253]\n"," [-0.01254409 0.30201192]\n"," [ 0.38358493 0.1570462 ]\n"," [ 0.8787462 -0.65476184]\n"," [ 0.08648817 0.1570462 ]\n"," [-1.89415691 -1.29261101]\n"," [-0.11157634 0.30201192]\n"," [-0.21060859 -0.27785096]\n"," [ 0.28455268 -0.50979612]\n"," [-0.21060859 1.6067034 ]\n"," [ 0.97777845 -1.17663843]\n"," [-0.21060859 1.63569655]\n"," [ 1.27487521 1.8676417 ]\n"," [-1.10189888 -0.3648304 ]\n"," [-0.01254409 0.04107362]\n"," [ 0.08648817 -0.24885782]\n"," [-1.59706014 -1.23462472]\n"," [-0.50770535 -0.27785096]\n"," [ 0.97777845 0.12805305]\n"," [ 1.96810099 -1.3505973 ]\n"," [ 1.47293972 0.07006676]\n"," [-0.60673761 1.37475825]\n"," [ 1.57197197 0.01208048]\n"," [-0.80480212 0.30201192]\n"," [ 1.96810099 0.73690908]\n"," [-1.20093113 -0.50979612]\n"," [ 0.68068169 0.27301877]\n"," [-1.39899564 -0.42281668]\n"," [ 0.18552042 0.1570462 ]\n"," [-0.50770535 -1.20563157]\n"," [ 0.58164944 2.01260742]\n"," [-1.59706014 -1.49556302]\n"," [-0.50770535 -0.53878926]\n"," [ 0.48261718 1.83864855]\n"," [-1.39899564 -1.089659 ]\n"," [ 0.77971394 -1.37959044]\n"," [-0.30964085 -0.42281668]\n"," [ 1.57197197 0.99784738]\n"," [ 0.97777845 1.43274454]\n"," [-0.30964085 -0.48080297]\n"," [-0.11157634 2.15757314]\n"," [-1.49802789 -0.1038921 ]\n"," [-0.11157634 1.95462113]\n"," [-0.70576986 -0.33583725]\n"," [-0.50770535 -0.8287207 ]\n"," [ 0.68068169 -1.37959044]\n"," [-0.80480212 -1.58254245]\n"," [-1.89415691 -1.46656987]\n"," [ 1.07681071 0.12805305]\n"," [ 0.08648817 1.51972397]\n"," [-0.30964085 0.09905991]\n"," [ 0.08648817 0.04107362]\n"," [-1.39899564 -1.3505973 ]\n"," [ 0.28455268 0.07006676]\n"," [-0.90383437 0.38899135]\n"," [ 1.57197197 -1.26361786]\n"," [-0.30964085 -0.74174127]\n"," [-0.11157634 0.1570462 ]\n"," [-0.90383437 -0.65476184]\n"," [-0.70576986 -0.04590581]\n"," [ 0.38358493 -0.45180983]\n"," [-0.80480212 1.89663484]\n"," [ 1.37390747 
1.28777882]\n"," [ 1.17584296 -0.97368642]\n"," [ 1.77003648 1.83864855]\n"," [-0.90383437 -0.24885782]\n"," [-0.80480212 0.56295021]\n"," [-1.20093113 -1.5535493 ]\n"," [-0.50770535 -1.11865214]\n"," [ 0.28455268 0.07006676]\n"," [-0.21060859 -1.06066585]\n"," [ 1.67100423 1.6067034 ]\n"," [ 0.97777845 1.78066227]\n"," [ 0.28455268 0.04107362]\n"," [-0.80480212 -0.21986468]\n"," [-0.11157634 0.07006676]\n"," [ 0.28455268 -0.19087153]\n"," [ 1.96810099 -0.65476184]\n"," [-0.80480212 1.3457651 ]\n"," [-1.79512465 -0.59677555]\n"," [-0.11157634 0.12805305]\n"," [ 0.28455268 -0.30684411]\n"," [ 1.07681071 0.56295021]\n"," [-1.00286662 0.27301877]\n"," [ 1.47293972 0.35999821]\n"," [ 0.18552042 -0.3648304 ]\n"," [ 2.1661655 -1.03167271]\n"," [-0.30964085 1.11381995]\n"," [-1.6960924 0.07006676]\n"," [-0.01254409 0.04107362]\n"," [ 0.08648817 1.05583366]\n"," [-0.11157634 -0.3648304 ]\n"," [-1.20093113 0.07006676]\n"," [-0.30964085 -1.3505973 ]\n"," [ 1.57197197 1.11381995]\n"," [-0.80480212 -1.52455616]\n"," [ 0.08648817 1.8676417 ]\n"," [-0.90383437 -0.77073441]\n"," [-0.50770535 -0.77073441]\n"," [-0.30964085 -0.91570013]\n"," [ 0.28455268 -0.71274813]\n"," [ 0.28455268 0.07006676]\n"," [ 0.08648817 1.8676417 ]\n"," [-1.10189888 1.95462113]\n"," [-1.6960924 -1.5535493 ]\n"," [-1.20093113 -1.089659 ]\n"," [-0.70576986 -0.1038921 ]\n"," [ 0.08648817 0.09905991]\n"," [ 0.28455268 0.27301877]\n"," [ 0.8787462 -0.5677824 ]\n"," [ 0.28455268 -1.14764529]\n"," [-0.11157634 0.67892279]\n"," [ 2.1661655 -0.68375498]\n"," [-1.29996338 -1.37959044]\n"," [-1.00286662 -0.94469328]\n"," [-0.01254409 -0.42281668]\n"," [-0.21060859 -0.45180983]\n"," [-1.79512465 -0.97368642]\n"," [ 1.77003648 0.99784738]\n"," [ 0.18552042 -0.3648304 ]\n"," [ 0.38358493 1.11381995]\n"," [-1.79512465 -1.3505973 ]\n"," [ 0.18552042 -0.13288524]\n"," [ 0.8787462 -1.43757673]\n"," [-1.99318916 0.47597078]\n"," [-0.30964085 0.27301877]\n"," [ 1.86906873 -1.06066585]\n"," [-0.4086731 0.07006676]\n"," [ 
1.07681071 -0.88670699]\n"," [-1.10189888 -1.11865214]\n"," [-1.89415691 0.01208048]\n"," [ 0.08648817 0.27301877]\n"," [-1.20093113 0.33100506]\n"," [-1.29996338 0.30201192]\n"," [-1.00286662 0.44697764]\n"," [ 1.67100423 -0.88670699]\n"," [ 1.17584296 0.53395707]\n"," [ 1.07681071 0.53395707]\n"," [ 1.37390747 2.331532 ]\n"," [-0.30964085 -0.13288524]\n"," [ 0.38358493 -0.45180983]\n"," [-0.4086731 -0.77073441]\n"," [-0.11157634 -0.50979612]\n"," [ 0.97777845 -1.14764529]\n"," [-0.90383437 -0.77073441]\n"," [-0.21060859 -0.50979612]\n"," [-1.10189888 -0.45180983]\n"," [-1.20093113 1.40375139]]\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"JUd6iBRp2C3L","colab_type":"code","outputId":"5762f294-8c56-4d79-c441-3468e2cb5e6a","executionInfo":{"status":"ok","timestamp":1588269312370,"user_tz":-240,"elapsed":2041,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":1000}},"source":["print(X_test)"],"execution_count":10,"outputs":[{"output_type":"stream","text":["[[-0.80480212 0.50496393]\n"," [-0.01254409 -0.5677824 ]\n"," [-0.30964085 0.1570462 ]\n"," [-0.80480212 0.27301877]\n"," [-0.30964085 -0.5677824 ]\n"," [-1.10189888 -1.43757673]\n"," [-0.70576986 -1.58254245]\n"," [-0.21060859 2.15757314]\n"," [-1.99318916 -0.04590581]\n"," [ 0.8787462 -0.77073441]\n"," [-0.80480212 -0.59677555]\n"," [-1.00286662 -0.42281668]\n"," [-0.11157634 -0.42281668]\n"," [ 0.08648817 0.21503249]\n"," [-1.79512465 0.47597078]\n"," [-0.60673761 1.37475825]\n"," [-0.11157634 0.21503249]\n"," [-1.89415691 0.44697764]\n"," [ 1.67100423 1.75166912]\n"," [-0.30964085 -1.37959044]\n"," [-0.30964085 -0.65476184]\n"," [ 0.8787462 2.15757314]\n"," [ 0.28455268 -0.53878926]\n"," [ 0.8787462 1.02684052]\n"," [-1.49802789 -1.20563157]\n"," [ 1.07681071 2.07059371]\n"," [-1.00286662 0.50496393]\n"," 
[-0.90383437 0.30201192]\n"," [-0.11157634 -0.21986468]\n"," [-0.60673761 0.47597078]\n"," [-1.6960924 0.53395707]\n"," [-0.11157634 0.27301877]\n"," [ 1.86906873 -0.27785096]\n"," [-0.11157634 -0.48080297]\n"," [-1.39899564 -0.33583725]\n"," [-1.99318916 -0.50979612]\n"," [-1.59706014 0.33100506]\n"," [-0.4086731 -0.77073441]\n"," [-0.70576986 -1.03167271]\n"," [ 1.07681071 -0.97368642]\n"," [-1.10189888 0.53395707]\n"," [ 0.28455268 -0.50979612]\n"," [-1.10189888 0.41798449]\n"," [-0.30964085 -1.43757673]\n"," [ 0.48261718 1.22979253]\n"," [-1.10189888 -0.33583725]\n"," [-0.11157634 0.30201192]\n"," [ 1.37390747 0.59194336]\n"," [-1.20093113 -1.14764529]\n"," [ 1.07681071 0.47597078]\n"," [ 1.86906873 1.51972397]\n"," [-0.4086731 -1.29261101]\n"," [-0.30964085 -0.3648304 ]\n"," [-0.4086731 1.31677196]\n"," [ 2.06713324 0.53395707]\n"," [ 0.68068169 -1.089659 ]\n"," [-0.90383437 0.38899135]\n"," [-1.20093113 0.30201192]\n"," [ 1.07681071 -1.20563157]\n"," [-1.49802789 -1.43757673]\n"," [-0.60673761 -1.49556302]\n"," [ 2.1661655 -0.79972756]\n"," [-1.89415691 0.18603934]\n"," [-0.21060859 0.85288166]\n"," [-1.89415691 -1.26361786]\n"," [ 2.1661655 0.38899135]\n"," [-1.39899564 0.56295021]\n"," [-1.10189888 -0.33583725]\n"," [ 0.18552042 -0.65476184]\n"," [ 0.38358493 0.01208048]\n"," [-0.60673761 2.331532 ]\n"," [-0.30964085 0.21503249]\n"," [-1.59706014 -0.19087153]\n"," [ 0.68068169 -1.37959044]\n"," [-1.10189888 0.56295021]\n"," [-1.99318916 0.35999821]\n"," [ 0.38358493 0.27301877]\n"," [ 0.18552042 -0.27785096]\n"," [ 1.47293972 -1.03167271]\n"," [ 0.8787462 1.08482681]\n"," [ 1.96810099 2.15757314]\n"," [ 2.06713324 0.38899135]\n"," [-1.39899564 -0.42281668]\n"," [-1.20093113 -1.00267957]\n"," [ 1.96810099 -0.91570013]\n"," [ 0.38358493 0.30201192]\n"," [ 0.18552042 0.1570462 ]\n"," [ 2.06713324 1.75166912]\n"," [ 0.77971394 -0.8287207 ]\n"," [ 0.28455268 -0.27785096]\n"," [ 0.38358493 -0.16187839]\n"," [-0.11157634 2.21555943]\n"," [-1.49802789 
-0.62576869]\n"," [-1.29996338 -1.06066585]\n"," [-1.39899564 0.41798449]\n"," [-1.10189888 0.76590222]\n"," [-1.49802789 -0.19087153]\n"," [ 0.97777845 -1.06066585]\n"," [ 0.97777845 0.59194336]\n"," [ 0.38358493 0.99784738]]\n"],"name":"stdout"}]},{"cell_type":"markdown","metadata":{"id":"bb6jCOCQiAmP","colab_type":"text"},"source":["## Training the Decision Tree Classification model on the Training set"]},{"cell_type":"code","metadata":{"id":"e0pFVAmciHQs","colab_type":"code","outputId":"1a9b0904-ea86-40d9-bca2-a28fdf00d56d","executionInfo":{"status":"ok","timestamp":1588269312370,"user_tz":-240,"elapsed":2037,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":120}},"source":["from sklearn.tree import DecisionTreeClassifier\n","classifier = DecisionTreeClassifier(criterion = 'entropy', random_state = 0)\n","classifier.fit(X_train, y_train)"],"execution_count":11,"outputs":[{"output_type":"execute_result","data":{"text/plain":["DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='entropy',\n"," max_depth=None, max_features=None, max_leaf_nodes=None,\n"," min_impurity_decrease=0.0, min_impurity_split=None,\n"," min_samples_leaf=1, min_samples_split=2,\n"," min_weight_fraction_leaf=0.0, presort='deprecated',\n"," random_state=0, splitter='best')"]},"metadata":{"tags":[]},"execution_count":11}]},{"cell_type":"markdown","metadata":{"id":"yyxW5b395mR2","colab_type":"text"},"source":["## Predicting a new result"]},{"cell_type":"code","metadata":{"id":"f8YOXsQy58rP","colab_type":"code","outputId":"cd4b80f5-59ad-40b1-d5f3-8fc98b87bd66","executionInfo":{"status":"ok","timestamp":1588269312371,"user_tz":-240,"elapsed":2034,"user":{"displayName":"Hadelin de 
Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":34}},"source":["print(classifier.predict(sc.transform([[30,87000]])))"],"execution_count":12,"outputs":[{"output_type":"stream","text":["[0]\n"],"name":"stdout"}]},{"cell_type":"markdown","metadata":{"id":"vKYVQH-l5NpE","colab_type":"text"},"source":["## Predicting the Test set results"]},{"cell_type":"code","metadata":{"id":"p6VMTb2O4hwM","colab_type":"code","outputId":"05404102-6c3b-4c34-a180-e2a1d5a85e57","executionInfo":{"status":"ok","timestamp":1588269312371,"user_tz":-240,"elapsed":2029,"user":{"displayName":"Hadelin de Ponteves","photoUrl":"https://lh3.googleusercontent.com/a-/AOh14GhEuXdT7eQweUmRPW8_laJuPggSK6hfvpl5a6WBaA=s64","userId":"15047218817161520419"}},"colab":{"base_uri":"https://localhost:8080/","height":1000}},"source":["y_pred = classifier.predict(X_test)\n","print(np.concatenate((y_pred.reshape(len(y_pred),1), y_test.reshape(len(y_test),1)),1))"],"execution_count":13,"outputs":[{"output_type":"stream","text":["[[0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [1 0]\n"," [0 0]\n"," [1 0]\n"," [1 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 1]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [1 1]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 0]\n"," [1 1]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [1 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [1 1]\n"," [0 0]\n"," [0 0]\n"," [0 0]\n"," [0 
# %% [markdown]
# ## Making the Confusion Matrix

# %%
from sklearn.metrics import confusion_matrix, accuracy_score

# Compare the baseline classifier's test-set predictions with the true labels.
cm = confusion_matrix(y_test, y_pred)
print(cm)
accuracy_score(y_test, y_pred)

# %% [markdown]
# ## Visualising the Training set results

# %%
from matplotlib.colors import ListedColormap


def plot_decision_regions(X_scaled, y_true, title, model, scaler,
                          age_step=0.25, salary_step=0.25):
    """Draw the model's decision regions with the given samples on top.

    The training-set and test-set figures were produced by two copy-pasted
    cells that differed only in the data and the title; this function is that
    shared body.

    Parameters
    ----------
    X_scaled : array with two columns, already transformed by ``scaler``.
    y_true : class labels matching the rows of ``X_scaled``.
    title : figure title.
    model : fitted classifier exposing ``predict``.
    scaler : fitted scaler exposing ``transform`` and ``inverse_transform``.
    age_step, salary_step : grid spacing along each axis, in original units.
        The defaults reproduce the original cells. The printed dataset has
        salaries running from 15000 to 150000, so the 0.25 salary step yields
        hundreds of thousands of grid columns; pass a larger ``salary_step``
        for a much cheaper render.
    """
    palette = ListedColormap(('red', 'green'))

    # Plot in original units (age / salary) rather than standardized units.
    X_set = scaler.inverse_transform(X_scaled)
    ages = np.arange(start=X_set[:, 0].min() - 10,
                     stop=X_set[:, 0].max() + 10, step=age_step)
    salaries = np.arange(start=X_set[:, 1].min() - 1000,
                         stop=X_set[:, 1].max() + 1000, step=salary_step)
    X1, X2 = np.meshgrid(ages, salaries)

    # The model was trained on scaled inputs, so scale every grid point
    # before asking for its predicted class.
    grid_points = np.array([X1.ravel(), X2.ravel()]).T
    regions = model.predict(scaler.transform(grid_points)).reshape(X1.shape)

    plt.contourf(X1, X2, regions, alpha=0.75, cmap=palette)
    plt.xlim(X1.min(), X1.max())
    plt.ylim(X2.min(), X2.max())
    for i, j in enumerate(np.unique(y_true)):
        # `color=` takes one RGBA tuple for all points. Passing the tuple via
        # `c=` is what produced the "'c' argument looks like a single numeric
        # RGB or RGBA sequence" warning in the saved output.
        plt.scatter(X_set[y_true == j, 0], X_set[y_true == j, 1],
                    color=palette(i), label=j)
    plt.title(title)
    plt.xlabel('Age')
    plt.ylabel('Estimated Salary')
    plt.legend()
    plt.show()


# %%
plot_decision_regions(X_train, y_train,
                      'Decision Tree Classification (Training set)',
                      classifier, sc)

# %% [markdown]
# ## Visualising the Test set results

# %%
plot_decision_regions(X_test, y_test,
                      'Decision Tree Classification (Test set)',
                      classifier, sc)
# %% [markdown]
# # Decision Tree Classification

# %% [markdown]
# ## Importing the libraries

# %%
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd

# %% [markdown]
# ## Importing the dataset

# %%
dataset = pd.read_csv('Social_Network_Ads.csv')
# Every column except the last is a feature; the last column is the label.
X, y = dataset.iloc[:, :-1].values, dataset.iloc[:, -1].values

# %% [markdown]
# ## Splitting the dataset into the Training set and Test set

# %%
from sklearn.model_selection import train_test_split

# Hold out a quarter of the rows for testing; the fixed seed keeps the split
# the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.25, random_state=0
)

# %%
print(X_train)
38 50000]\n", + " [ 32 135000]\n", + " [ 52 21000]\n", + " [ 53 104000]\n", + " [ 39 42000]\n", + " [ 38 61000]\n", + " [ 36 50000]\n", + " [ 36 63000]\n", + " [ 35 25000]\n", + " [ 35 50000]\n", + " [ 42 73000]\n", + " [ 47 49000]\n", + " [ 59 29000]\n", + " [ 49 65000]\n", + " [ 45 131000]\n", + " [ 31 89000]\n", + " [ 46 82000]\n", + " [ 47 51000]\n", + " [ 26 15000]\n", + " [ 60 102000]\n", + " [ 38 112000]\n", + " [ 40 107000]\n", + " [ 42 53000]\n", + " [ 35 59000]\n", + " [ 48 41000]\n", + " [ 48 134000]\n", + " [ 38 113000]\n", + " [ 29 148000]\n", + " [ 26 15000]\n", + " [ 60 42000]\n", + " [ 24 19000]\n", + " [ 42 149000]\n", + " [ 46 96000]\n", + " [ 28 59000]\n", + " [ 39 96000]\n", + " [ 28 89000]\n", + " [ 41 72000]\n", + " [ 45 26000]\n", + " [ 33 69000]\n", + " [ 20 82000]\n", + " [ 31 74000]\n", + " [ 42 80000]\n", + " [ 35 72000]\n", + " [ 33 149000]\n", + " [ 40 71000]\n", + " [ 51 146000]\n", + " [ 46 79000]\n", + " [ 35 75000]\n", + " [ 38 51000]\n", + " [ 36 75000]\n", + " [ 37 78000]\n", + " [ 38 61000]\n", + " [ 60 108000]\n", + " [ 20 82000]\n", + " [ 57 74000]\n", + " [ 42 65000]\n", + " [ 26 80000]\n", + " [ 46 117000]\n", + " [ 35 61000]\n", + " [ 21 68000]\n", + " [ 28 44000]\n", + " [ 41 87000]\n", + " [ 37 33000]\n", + " [ 27 90000]\n", + " [ 39 42000]\n", + " [ 28 123000]\n", + " [ 31 118000]\n", + " [ 25 87000]\n", + " [ 35 71000]\n", + " [ 37 70000]\n", + " [ 35 39000]\n", + " [ 47 23000]\n", + " [ 35 147000]\n", + " [ 48 138000]\n", + " [ 26 86000]\n", + " [ 25 79000]\n", + " [ 52 138000]\n", + " [ 51 23000]\n", + " [ 35 60000]\n", + " [ 33 113000]\n", + " [ 30 107000]\n", + " [ 48 33000]\n", + " [ 41 80000]\n", + " [ 48 96000]\n", + " [ 31 18000]\n", + " [ 31 71000]\n", + " [ 43 129000]\n", + " [ 59 76000]\n", + " [ 18 44000]\n", + " [ 36 118000]\n", + " [ 42 90000]\n", + " [ 47 30000]\n", + " [ 26 43000]\n", + " [ 40 78000]\n", + " [ 46 59000]\n", + " [ 59 42000]\n", + " [ 46 74000]\n", + " [ 35 91000]\n", + " [ 28 59000]\n", + 
" [ 40 57000]\n", + " [ 59 143000]\n", + " [ 57 26000]\n", + " [ 52 38000]\n", + " [ 47 113000]\n", + " [ 53 143000]\n", + " [ 35 27000]\n", + " [ 58 101000]\n", + " [ 45 45000]\n", + " [ 23 82000]\n", + " [ 46 23000]\n", + " [ 42 65000]\n", + " [ 28 84000]\n", + " [ 38 59000]\n", + " [ 26 84000]\n", + " [ 29 28000]\n", + " [ 37 71000]\n", + " [ 22 55000]\n", + " [ 48 35000]\n", + " [ 49 28000]\n", + " [ 38 65000]\n", + " [ 27 17000]\n", + " [ 46 28000]\n", + " [ 48 141000]\n", + " [ 26 17000]\n", + " [ 35 97000]\n", + " [ 39 59000]\n", + " [ 24 27000]\n", + " [ 32 18000]\n", + " [ 46 88000]\n", + " [ 35 58000]\n", + " [ 56 60000]\n", + " [ 47 34000]\n", + " [ 40 72000]\n", + " [ 32 100000]\n", + " [ 19 21000]\n", + " [ 25 90000]\n", + " [ 35 88000]\n", + " [ 28 32000]\n", + " [ 50 20000]\n", + " [ 40 59000]\n", + " [ 50 44000]\n", + " [ 35 72000]\n", + " [ 40 142000]\n", + " [ 46 32000]\n", + " [ 39 71000]\n", + " [ 20 74000]\n", + " [ 29 75000]\n", + " [ 31 76000]\n", + " [ 47 25000]\n", + " [ 40 61000]\n", + " [ 34 112000]\n", + " [ 38 80000]\n", + " [ 42 75000]\n", + " [ 47 47000]\n", + " [ 39 75000]\n", + " [ 19 25000]\n", + " [ 37 80000]\n", + " [ 36 60000]\n", + " [ 41 52000]\n", + " [ 36 125000]\n", + " [ 48 29000]\n", + " [ 36 126000]\n", + " [ 51 134000]\n", + " [ 27 57000]\n", + " [ 38 71000]\n", + " [ 39 61000]\n", + " [ 22 27000]\n", + " [ 33 60000]\n", + " [ 48 74000]\n", + " [ 58 23000]\n", + " [ 53 72000]\n", + " [ 32 117000]\n", + " [ 54 70000]\n", + " [ 30 80000]\n", + " [ 58 95000]\n", + " [ 26 52000]\n", + " [ 45 79000]\n", + " [ 24 55000]\n", + " [ 40 75000]\n", + " [ 33 28000]\n", + " [ 44 139000]\n", + " [ 22 18000]\n", + " [ 33 51000]\n", + " [ 43 133000]\n", + " [ 24 32000]\n", + " [ 46 22000]\n", + " [ 35 55000]\n", + " [ 54 104000]\n", + " [ 48 119000]\n", + " [ 35 53000]\n", + " [ 37 144000]\n", + " [ 23 66000]\n", + " [ 37 137000]\n", + " [ 31 58000]\n", + " [ 33 41000]\n", + " [ 45 22000]\n", + " [ 30 15000]\n", + " [ 19 19000]\n", + " 
[ 49 74000]\n", + " [ 39 122000]\n", + " [ 35 73000]\n", + " [ 39 71000]\n", + " [ 24 23000]\n", + " [ 41 72000]\n", + " [ 29 83000]\n", + " [ 54 26000]\n", + " [ 35 44000]\n", + " [ 37 75000]\n", + " [ 29 47000]\n", + " [ 31 68000]\n", + " [ 42 54000]\n", + " [ 30 135000]\n", + " [ 52 114000]\n", + " [ 50 36000]\n", + " [ 56 133000]\n", + " [ 29 61000]\n", + " [ 30 89000]\n", + " [ 26 16000]\n", + " [ 33 31000]\n", + " [ 41 72000]\n", + " [ 36 33000]\n", + " [ 55 125000]\n", + " [ 48 131000]\n", + " [ 41 71000]\n", + " [ 30 62000]\n", + " [ 37 72000]\n", + " [ 41 63000]\n", + " [ 58 47000]\n", + " [ 30 116000]\n", + " [ 20 49000]\n", + " [ 37 74000]\n", + " [ 41 59000]\n", + " [ 49 89000]\n", + " [ 28 79000]\n", + " [ 53 82000]\n", + " [ 40 57000]\n", + " [ 60 34000]\n", + " [ 35 108000]\n", + " [ 21 72000]\n", + " [ 38 71000]\n", + " [ 39 106000]\n", + " [ 37 57000]\n", + " [ 26 72000]\n", + " [ 35 23000]\n", + " [ 54 108000]\n", + " [ 30 17000]\n", + " [ 39 134000]\n", + " [ 29 43000]\n", + " [ 33 43000]\n", + " [ 35 38000]\n", + " [ 41 45000]\n", + " [ 41 72000]\n", + " [ 39 134000]\n", + " [ 27 137000]\n", + " [ 21 16000]\n", + " [ 26 32000]\n", + " [ 31 66000]\n", + " [ 39 73000]\n", + " [ 41 79000]\n", + " [ 47 50000]\n", + " [ 41 30000]\n", + " [ 37 93000]\n", + " [ 60 46000]\n", + " [ 25 22000]\n", + " [ 28 37000]\n", + " [ 38 55000]\n", + " [ 36 54000]\n", + " [ 20 36000]\n", + " [ 56 104000]\n", + " [ 40 57000]\n", + " [ 42 108000]\n", + " [ 20 23000]\n", + " [ 40 65000]\n", + " [ 47 20000]\n", + " [ 18 86000]\n", + " [ 35 79000]\n", + " [ 57 33000]\n", + " [ 34 72000]\n", + " [ 49 39000]\n", + " [ 27 31000]\n", + " [ 19 70000]\n", + " [ 39 79000]\n", + " [ 26 81000]\n", + " [ 25 80000]\n", + " [ 28 85000]\n", + " [ 55 39000]\n", + " [ 50 88000]\n", + " [ 49 88000]\n", + " [ 52 150000]\n", + " [ 35 65000]\n", + " [ 42 54000]\n", + " [ 34 43000]\n", + " [ 37 52000]\n", + " [ 48 30000]\n", + " [ 29 43000]\n", + " [ 36 52000]\n", + " [ 27 54000]\n", + " [ 
# %%
print(y_train)

# %%
print(X_test)

# %%
print(y_test)

# %% [markdown]
# ## Feature Scaling

# %%
from sklearn.preprocessing import StandardScaler

# Fit the scaler on the training split only, then apply that same fitted
# transform to both splits.
# NOTE: X_train and X_test are overwritten here, so re-running this cell
# without re-running the split would scale data that is already scaled.
sc = StandardScaler().fit(X_train)
X_train, X_test = sc.transform(X_train), sc.transform(X_test)

# %%
print(X_train)
0.07006676]\n", + " [ 0.68068169 -1.26361786]\n", + " [-0.50770535 -0.01691267]\n", + " [-1.79512465 0.35999821]\n", + " [-0.70576986 0.12805305]\n", + " [ 0.38358493 0.30201192]\n", + " [-0.30964085 0.07006676]\n", + " [-0.50770535 2.30253886]\n", + " [ 0.18552042 0.04107362]\n", + " [ 1.27487521 2.21555943]\n", + " [ 0.77971394 0.27301877]\n", + " [-0.30964085 0.1570462 ]\n", + " [-0.01254409 -0.53878926]\n", + " [-0.21060859 0.1570462 ]\n", + " [-0.11157634 0.24402563]\n", + " [-0.01254409 -0.24885782]\n", + " [ 2.1661655 1.11381995]\n", + " [-1.79512465 0.35999821]\n", + " [ 1.86906873 0.12805305]\n", + " [ 0.38358493 -0.13288524]\n", + " [-1.20093113 0.30201192]\n", + " [ 0.77971394 1.37475825]\n", + " [-0.30964085 -0.24885782]\n", + " [-1.6960924 -0.04590581]\n", + " [-1.00286662 -0.74174127]\n", + " [ 0.28455268 0.50496393]\n", + " [-0.11157634 -1.06066585]\n", + " [-1.10189888 0.59194336]\n", + " [ 0.08648817 -0.79972756]\n", + " [-1.00286662 1.54871711]\n", + " [-0.70576986 1.40375139]\n", + " [-1.29996338 0.50496393]\n", + " [-0.30964085 0.04107362]\n", + " [-0.11157634 0.01208048]\n", + " [-0.30964085 -0.88670699]\n", + " [ 0.8787462 -1.3505973 ]\n", + " [-0.30964085 2.24455257]\n", + " [ 0.97777845 1.98361427]\n", + " [-1.20093113 0.47597078]\n", + " [-1.29996338 0.27301877]\n", + " [ 1.37390747 1.98361427]\n", + " [ 1.27487521 -1.3505973 ]\n", + " [-0.30964085 -0.27785096]\n", + " [-0.50770535 1.25878567]\n", + " [-0.80480212 1.08482681]\n", + " [ 0.97777845 -1.06066585]\n", + " [ 0.28455268 0.30201192]\n", + " [ 0.97777845 0.76590222]\n", + " [-0.70576986 -1.49556302]\n", + " [-0.70576986 0.04107362]\n", + " [ 0.48261718 1.72267598]\n", + " [ 2.06713324 0.18603934]\n", + " [-1.99318916 -0.74174127]\n", + " [-0.21060859 1.40375139]\n", + " [ 0.38358493 0.59194336]\n", + " [ 0.8787462 -1.14764529]\n", + " [-1.20093113 -0.77073441]\n", + " [ 0.18552042 0.24402563]\n", + " [ 0.77971394 -0.30684411]\n", + " [ 2.06713324 -0.79972756]\n", + " [ 0.77971394 
0.12805305]\n", + " [-0.30964085 0.6209365 ]\n", + " [-1.00286662 -0.30684411]\n", + " [ 0.18552042 -0.3648304 ]\n", + " [ 2.06713324 2.12857999]\n", + " [ 1.86906873 -1.26361786]\n", + " [ 1.37390747 -0.91570013]\n", + " [ 0.8787462 1.25878567]\n", + " [ 1.47293972 2.12857999]\n", + " [-0.30964085 -1.23462472]\n", + " [ 1.96810099 0.91086794]\n", + " [ 0.68068169 -0.71274813]\n", + " [-1.49802789 0.35999821]\n", + " [ 0.77971394 -1.3505973 ]\n", + " [ 0.38358493 -0.13288524]\n", + " [-1.00286662 0.41798449]\n", + " [-0.01254409 -0.30684411]\n", + " [-1.20093113 0.41798449]\n", + " [-0.90383437 -1.20563157]\n", + " [-0.11157634 0.04107362]\n", + " [-1.59706014 -0.42281668]\n", + " [ 0.97777845 -1.00267957]\n", + " [ 1.07681071 -1.20563157]\n", + " [-0.01254409 -0.13288524]\n", + " [-1.10189888 -1.52455616]\n", + " [ 0.77971394 -1.20563157]\n", + " [ 0.97777845 2.07059371]\n", + " [-1.20093113 -1.52455616]\n", + " [-0.30964085 0.79489537]\n", + " [ 0.08648817 -0.30684411]\n", + " [-1.39899564 -1.23462472]\n", + " [-0.60673761 -1.49556302]\n", + " [ 0.77971394 0.53395707]\n", + " [-0.30964085 -0.33583725]\n", + " [ 1.77003648 -0.27785096]\n", + " [ 0.8787462 -1.03167271]\n", + " [ 0.18552042 0.07006676]\n", + " [-0.60673761 0.8818748 ]\n", + " [-1.89415691 -1.40858358]\n", + " [-1.29996338 0.59194336]\n", + " [-0.30964085 0.53395707]\n", + " [-1.00286662 -1.089659 ]\n", + " [ 1.17584296 -1.43757673]\n", + " [ 0.18552042 -0.30684411]\n", + " [ 1.17584296 -0.74174127]\n", + " [-0.30964085 0.07006676]\n", + " [ 0.18552042 2.09958685]\n", + " [ 0.77971394 -1.089659 ]\n", + " [ 0.08648817 0.04107362]\n", + " [-1.79512465 0.12805305]\n", + " [-0.90383437 0.1570462 ]\n", + " [-0.70576986 0.18603934]\n", + " [ 0.8787462 -1.29261101]\n", + " [ 0.18552042 -0.24885782]\n", + " [-0.4086731 1.22979253]\n", + " [-0.01254409 0.30201192]\n", + " [ 0.38358493 0.1570462 ]\n", + " [ 0.8787462 -0.65476184]\n", + " [ 0.08648817 0.1570462 ]\n", + " [-1.89415691 -1.29261101]\n", + " 
[-0.11157634 0.30201192]\n", + " [-0.21060859 -0.27785096]\n", + " [ 0.28455268 -0.50979612]\n", + " [-0.21060859 1.6067034 ]\n", + " [ 0.97777845 -1.17663843]\n", + " [-0.21060859 1.63569655]\n", + " [ 1.27487521 1.8676417 ]\n", + " [-1.10189888 -0.3648304 ]\n", + " [-0.01254409 0.04107362]\n", + " [ 0.08648817 -0.24885782]\n", + " [-1.59706014 -1.23462472]\n", + " [-0.50770535 -0.27785096]\n", + " [ 0.97777845 0.12805305]\n", + " [ 1.96810099 -1.3505973 ]\n", + " [ 1.47293972 0.07006676]\n", + " [-0.60673761 1.37475825]\n", + " [ 1.57197197 0.01208048]\n", + " [-0.80480212 0.30201192]\n", + " [ 1.96810099 0.73690908]\n", + " [-1.20093113 -0.50979612]\n", + " [ 0.68068169 0.27301877]\n", + " [-1.39899564 -0.42281668]\n", + " [ 0.18552042 0.1570462 ]\n", + " [-0.50770535 -1.20563157]\n", + " [ 0.58164944 2.01260742]\n", + " [-1.59706014 -1.49556302]\n", + " [-0.50770535 -0.53878926]\n", + " [ 0.48261718 1.83864855]\n", + " [-1.39899564 -1.089659 ]\n", + " [ 0.77971394 -1.37959044]\n", + " [-0.30964085 -0.42281668]\n", + " [ 1.57197197 0.99784738]\n", + " [ 0.97777845 1.43274454]\n", + " [-0.30964085 -0.48080297]\n", + " [-0.11157634 2.15757314]\n", + " [-1.49802789 -0.1038921 ]\n", + " [-0.11157634 1.95462113]\n", + " [-0.70576986 -0.33583725]\n", + " [-0.50770535 -0.8287207 ]\n", + " [ 0.68068169 -1.37959044]\n", + " [-0.80480212 -1.58254245]\n", + " [-1.89415691 -1.46656987]\n", + " [ 1.07681071 0.12805305]\n", + " [ 0.08648817 1.51972397]\n", + " [-0.30964085 0.09905991]\n", + " [ 0.08648817 0.04107362]\n", + " [-1.39899564 -1.3505973 ]\n", + " [ 0.28455268 0.07006676]\n", + " [-0.90383437 0.38899135]\n", + " [ 1.57197197 -1.26361786]\n", + " [-0.30964085 -0.74174127]\n", + " [-0.11157634 0.1570462 ]\n", + " [-0.90383437 -0.65476184]\n", + " [-0.70576986 -0.04590581]\n", + " [ 0.38358493 -0.45180983]\n", + " [-0.80480212 1.89663484]\n", + " [ 1.37390747 1.28777882]\n", + " [ 1.17584296 -0.97368642]\n", + " [ 1.77003648 1.83864855]\n", + " [-0.90383437 
-0.24885782]\n", + " [-0.80480212 0.56295021]\n", + " [-1.20093113 -1.5535493 ]\n", + " [-0.50770535 -1.11865214]\n", + " [ 0.28455268 0.07006676]\n", + " [-0.21060859 -1.06066585]\n", + " [ 1.67100423 1.6067034 ]\n", + " [ 0.97777845 1.78066227]\n", + " [ 0.28455268 0.04107362]\n", + " [-0.80480212 -0.21986468]\n", + " [-0.11157634 0.07006676]\n", + " [ 0.28455268 -0.19087153]\n", + " [ 1.96810099 -0.65476184]\n", + " [-0.80480212 1.3457651 ]\n", + " [-1.79512465 -0.59677555]\n", + " [-0.11157634 0.12805305]\n", + " [ 0.28455268 -0.30684411]\n", + " [ 1.07681071 0.56295021]\n", + " [-1.00286662 0.27301877]\n", + " [ 1.47293972 0.35999821]\n", + " [ 0.18552042 -0.3648304 ]\n", + " [ 2.1661655 -1.03167271]\n", + " [-0.30964085 1.11381995]\n", + " [-1.6960924 0.07006676]\n", + " [-0.01254409 0.04107362]\n", + " [ 0.08648817 1.05583366]\n", + " [-0.11157634 -0.3648304 ]\n", + " [-1.20093113 0.07006676]\n", + " [-0.30964085 -1.3505973 ]\n", + " [ 1.57197197 1.11381995]\n", + " [-0.80480212 -1.52455616]\n", + " [ 0.08648817 1.8676417 ]\n", + " [-0.90383437 -0.77073441]\n", + " [-0.50770535 -0.77073441]\n", + " [-0.30964085 -0.91570013]\n", + " [ 0.28455268 -0.71274813]\n", + " [ 0.28455268 0.07006676]\n", + " [ 0.08648817 1.8676417 ]\n", + " [-1.10189888 1.95462113]\n", + " [-1.6960924 -1.5535493 ]\n", + " [-1.20093113 -1.089659 ]\n", + " [-0.70576986 -0.1038921 ]\n", + " [ 0.08648817 0.09905991]\n", + " [ 0.28455268 0.27301877]\n", + " [ 0.8787462 -0.5677824 ]\n", + " [ 0.28455268 -1.14764529]\n", + " [-0.11157634 0.67892279]\n", + " [ 2.1661655 -0.68375498]\n", + " [-1.29996338 -1.37959044]\n", + " [-1.00286662 -0.94469328]\n", + " [-0.01254409 -0.42281668]\n", + " [-0.21060859 -0.45180983]\n", + " [-1.79512465 -0.97368642]\n", + " [ 1.77003648 0.99784738]\n", + " [ 0.18552042 -0.3648304 ]\n", + " [ 0.38358493 1.11381995]\n", + " [-1.79512465 -1.3505973 ]\n", + " [ 0.18552042 -0.13288524]\n", + " [ 0.8787462 -1.43757673]\n", + " [-1.99318916 0.47597078]\n", + " 
# %%
print(X_test)

# %% [markdown]
# ## Training the Decision Tree Classification model on the Training set

# %%
from sklearn.tree import DecisionTreeClassifier

# Baseline tree: entropy split criterion, fixed seed for repeatable results.
# `fit` returns the estimator itself, so construction and fitting can be chained.
classifier = DecisionTreeClassifier(criterion='entropy', random_state=0).fit(
    X_train, y_train
)
classifier
DecisionTreeClassifier(criterion='entropy', random_state=0)
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
# %%
from sklearn.model_selection import GridSearchCV

# Candidate hyper-parameters; every combination is scored with
# 5-fold cross-validation on the training split.
param_grid = dict(
    criterion=['gini', 'entropy'],
    max_depth=[None, 5, 10, 15, 20],
    min_samples_split=[2, 5, 10],
    min_samples_leaf=[1, 2, 4],
)

# n_jobs=-1 is passed through unchanged from the original cell.
grid_search = GridSearchCV(
    estimator=classifier, param_grid=param_grid, cv=5, n_jobs=-1
).fit(X_train, y_train)
grid_search
GridSearchCV(cv=5,\n",
+              "             estimator=DecisionTreeClassifier(criterion='entropy',\n",
+              "                                              random_state=0),\n",
+              "             n_jobs=-1,\n",
+              "             param_grid={'criterion': ['gini', 'entropy'],\n",
+              "                         'max_depth': [None, 5, 10, 15, 20],\n",
+              "                         'min_samples_leaf': [1, 2, 4],\n",
+              "                         'min_samples_split': [2, 5, 10]})
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
# %%
# Keep the winning configuration and the estimator the search selected.
best_model = grid_search.best_estimator_
best_params = grid_search.best_params_

# %%
print(best_params)

# %% [markdown]
# ## Predicting a new result

# %%
# The query (age 30, salary 87000) must go through the same scaler as the
# training data before the baseline classifier sees it.
print(classifier.predict(sc.transform([[30,87000]])))

# %% [markdown]
# ## Predicting the Test set results

# %%
y_pred = classifier.predict(X_test)
# Two columns side by side: predicted label, then true label.
print(np.column_stack((y_pred, y_test)))
[0 0]\n", + " [1 0]\n", + " [0 0]\n", + " [1 0]\n", + " [1 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 1]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [1 1]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 0]\n", + " [1 1]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [1 1]\n", + " [1 1]\n", + " [1 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 1]\n", + " [0 0]\n", + " [1 1]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [0 0]\n", + " [0 0]\n", + " [1 1]\n", + " [0 0]\n", + " [1 1]\n", + " [1 1]\n", + " [1 1]]\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "h4Hwj34ziWQW" + }, + "source": [ + "## Making the Confusion Matrix" + ] + }, + { + "cell_type": "code", + "source": [ + "accuracy = best_model.score(X_test, y_test)\n", + "print(\"Best Model Accuracy:\", accuracy)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "V77dtvP9_hcz", + "outputId": "9c66432d-1880-48a7-b245-2b36d63d7c59" + }, + "execution_count": 23, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Best Model Accuracy: 0.94\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "from sklearn.metrics import confusion_matrix, accuracy_score\n", + "cm = confusion_matrix(y_test, y_pred1)\n", + 
"print(cm)\n", + "accuracy_score(y_test, y_pred1)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "M2WsXkhm-Q4w", + "outputId": "f123de83-3864-4860-cf1d-95e3a68f97d2" + }, + "execution_count": 20, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[62 6]\n", + " [ 4 28]]\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "0.9" + ] + }, + "metadata": {}, + "execution_count": 20 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "D6bpZwUiiXic", + "outputId": "e37696d8-cfb7-4170-d3fc-88423a8ec8a7", + "colab": { + "base_uri": "https://localhost:8080/" + } + }, + "source": [ + "from sklearn.metrics import confusion_matrix, accuracy_score\n", + "cm = confusion_matrix(y_test, y_pred)\n", + "print(cm)\n", + "accuracy_score(y_test, y_pred)" + ], + "execution_count": 15, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[62 6]\n", + " [ 3 29]]\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "0.91" + ] + }, + "metadata": {}, + "execution_count": 15 + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "6OMC_P0diaoD" + }, + "source": [ + "## Visualising the Training set results" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "_NOjKvZRid5l", + "outputId": "d655d1ff-9d65-4dec-8c32-114118b28aa2", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 527 + } + }, + "source": [ + "from matplotlib.colors import ListedColormap\n", + "X_set, y_set = sc.inverse_transform(X_train), y_train\n", + "X1, X2 = np.meshgrid(np.arange(start = X_set[:, 0].min() - 10, stop = X_set[:, 0].max() + 10, step = 0.25),\n", + " np.arange(start = X_set[:, 1].min() - 1000, stop = X_set[:, 1].max() + 1000, step = 0.25))\n", + "plt.contourf(X1, X2, classifier.predict(sc.transform(np.array([X1.ravel(), X2.ravel()]).T)).reshape(X1.shape),\n", + " alpha = 0.75, cmap = ListedColormap(('red', 
'green')))\n", + "plt.xlim(X1.min(), X1.max())\n", + "plt.ylim(X2.min(), X2.max())\n", + "for i, j in enumerate(np.unique(y_set)):\n", + " plt.scatter(X_set[y_set == j, 0], X_set[y_set == j, 1], c = ListedColormap(('red', 'green'))(i), label = j)\n", + "plt.title('Decision Tree Classification (Training set)')\n", + "plt.xlabel('Age')\n", + "plt.ylabel('Estimated Salary')\n", + "plt.legend()\n", + "plt.show()" + ], + "execution_count": 16, + "outputs": [ + { + "output_type": "stream", + "name": "stderr", + "text": [ + ":10: UserWarning: *c* argument looks like a single numeric RGB or RGBA sequence, which should be avoided as value-mapping will have precedence in case its length matches with *x* & *y*. Please use the *color* keyword-argument or provide a 2D array with a single row if you intend to specify the same RGB or RGBA value for all points.\n", + " plt.scatter(X_set[y_set == j, 0], X_set[y_set == j, 1], c = ListedColormap(('red', 'green'))(i), label = j)\n" + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "SZ-j28aPihZx" + }, + "source": [ + "## Visualising the Test set results" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "qeTjz2vDilAC", + "outputId": "ee634ff6-2fc8-40f4-cd47-b9bd2b99887b", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 808 + } + }, + "source": [ + "from matplotlib.colors import ListedColormap\n", + "X_set, y_set = sc.inverse_transform(X_test), y_test\n", + "X1, X2 = np.meshgrid(np.arange(start = X_set[:, 0].min() - 10, stop = X_set[:, 0].max() + 10, step = 0.25),\n", + " np.arange(start = X_set[:, 1].min() - 1000, stop = X_set[:, 1].max() + 1000, step = 0.25))\n", + "plt.contourf(X1, X2, classifier.predict(sc.transform(np.array([X1.ravel(), X2.ravel()]).T)).reshape(X1.shape),\n", + " alpha = 0.75, cmap = ListedColormap(('red', 'green')))\n", + "plt.xlim(X1.min(), X1.max())\n", + "plt.ylim(X2.min(), X2.max())\n", + "for i, j in enumerate(np.unique(y_set)):\n", + " plt.scatter(X_set[y_set == j, 0], X_set[y_set == j, 1], c = ListedColormap(('red', 'green'))(i), label = j)\n", + "plt.title('Decision Tree Classification (Test set)')\n", + "plt.xlabel('Age')\n", + "plt.ylabel('Estimated Salary')\n", + "plt.legend()\n", + "plt.show()" + ], + "execution_count": 17, + "outputs": [ + { + "output_type": "error", + "ename": "KeyboardInterrupt", + "evalue": "ignored", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 3\u001b[0m X1, X2 = np.meshgrid(np.arange(start = X_set[:, 0].min() - 10, stop = X_set[:, 0].max() + 10, step = 0.25),\n\u001b[1;32m 4\u001b[0m np.arange(start = X_set[:, 1].min() - 1000, stop = X_set[:, 1].max() + 1000, step = 0.25))\n\u001b[0;32m----> 5\u001b[0;31m 
plt.contourf(X1, X2, classifier.predict(sc.transform(np.array([X1.ravel(), X2.ravel()]).T)).reshape(X1.shape),\n\u001b[0m\u001b[1;32m 6\u001b[0m alpha = 0.75, cmap = ListedColormap(('red', 'green')))\n\u001b[1;32m 7\u001b[0m \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mxlim\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mX1\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX1\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/matplotlib/pyplot.py\u001b[0m in \u001b[0;36mcontourf\u001b[0;34m(data, *args, **kwargs)\u001b[0m\n\u001b[1;32m 2535\u001b[0m \u001b[0;34m@\u001b[0m\u001b[0m_copy_docstring_and_deprecators\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mAxes\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcontourf\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2536\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mcontourf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2537\u001b[0;31m __ret = gca().contourf(\n\u001b[0m\u001b[1;32m 2538\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0;34m\"data\"\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m}\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mdata\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m \u001b[0;32melse\u001b[0m 
\u001b[0;34m{\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2539\u001b[0m **kwargs)\n", + "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/matplotlib/__init__.py\u001b[0m in \u001b[0;36minner\u001b[0;34m(ax, data, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1440\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0minner\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0max\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1441\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mdata\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1442\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0max\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0mmap\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msanitize_sequence\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1443\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1444\u001b[0m \u001b[0mbound\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnew_sig\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbind\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0max\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/matplotlib/axes/_axes.py\u001b[0m in 
\u001b[0;36mcontourf\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 6465\u001b[0m \"\"\"\n\u001b[1;32m 6466\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'filled'\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 6467\u001b[0;31m \u001b[0mcontours\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmcontour\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mQuadContourSet\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 6468\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_request_autoscale_view\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 6469\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mcontours\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/matplotlib/contour.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, ax, levels, filled, linewidths, linestyles, hatches, alpha, origin, extent, cmap, colors, norm, vmin, vmax, extend, antialiased, nchunk, locator, transform, negative_linestyles, *args, **kwargs)\u001b[0m\n\u001b[1;32m 821\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 822\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mgetattr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'allsegs'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 823\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mallsegs\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mallkinds\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_get_allsegs_and_allkinds\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 824\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mallkinds\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 825\u001b[0m \u001b[0;31m# allsegs specified in constructor may or may not have allkinds as\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/matplotlib/contour.py\u001b[0m in \u001b[0;36m_get_allsegs_and_allkinds\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1004\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mlevel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlevel_upper\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mzip\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlowers\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0muppers\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1005\u001b[0m \u001b[0mvertices\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkinds\u001b[0m \u001b[0;34m=\u001b[0m\u001b[0;31m \u001b[0m\u001b[0;31m\\\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1006\u001b[0;31m self._contour_generator.create_filled_contour(\n\u001b[0m\u001b[1;32m 1007\u001b[0m level, level_upper)\n\u001b[1;32m 1008\u001b[0m \u001b[0mallsegs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mvertices\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mKeyboardInterrupt\u001b[0m: " + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + } + ] +} \ No newline at end of file