{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[],"collapsed_sections":[],"authorship_tag":"ABX9TyN1XagztLOzsfPrdgtTm2ZH"},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"}},"cells":[{"cell_type":"markdown","source":["# **UTS Data Mining**"],"metadata":{"id":"hLKqVf4RRQBz"}},{"cell_type":"markdown","source":["### Klasifikasi Data Pada Dataset Breast Cancer"],"metadata":{"id":"dpr8fvexVU_U"}},{"cell_type":"markdown","source":["Lakukan analisa terhadap data pada\n","https://archive.ics.uci.edu/ml/datasets/Breast+Cancer+Coimbra dengan menggunakan klasifikasi\n","\n"," - Metode KNN\n","\n"," - Metode pohon keputusan (Decision tree)"],"metadata":{"id":"Sod8cg80Vacv"}},{"cell_type":"markdown","source":["## Data"],"metadata":{"id":"qRrRZ65QV7WZ"}},{"cell_type":"code","execution_count":60,"metadata":{"id":"6hUZnrOCQ1af","executionInfo":{"status":"ok","timestamp":1665968941292,"user_tz":-420,"elapsed":371,"user":{"displayName":"Caca Erha","userId":"13359221303846732984"}}},"outputs":[],"source":["import numpy as np\n","import matplotlib.pyplot as plt\n","import seaborn as sns\n","import numba\n","import cv2 as cv\n","import pandas as pd\n","from sklearn.decomposition import PCA\n","from sklearn.neighbors import KNeighborsClassifier\n","from sklearn.metrics import confusion_matrix\n","from sklearn.model_selection import train_test_split\n","from sklearn.metrics import classification_report\n","from sklearn.tree import DecisionTreeClassifier\n","from sklearn.metrics import accuracy_score\n","from sklearn import tree\n","from matplotlib import pyplot as plt \n"]},{"cell_type":"code","source":["data = pd.read_csv(\"https://raw.githubusercontent.com/LALA09-erha/Python-StrukturData/master/dataR2.csv\")\n","data_1 = 
pd.read_csv(\"https://raw.githubusercontent.com/LALA09-erha/Python-StrukturData/master/dataR2.csv\")\n","data"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":424},"id":"EBWEN1F6Vv-Q","executionInfo":{"status":"ok","timestamp":1665968942371,"user_tz":-420,"elapsed":706,"user":{"displayName":"Caca Erha","userId":"13359221303846732984"}},"outputId":"333f0037-efdd-4bd6-f92f-8fc93be0ba09"},"execution_count":61,"outputs":[{"output_type":"execute_result","data":{"text/plain":[" Age BMI Glucose Insulin HOMA Leptin Adiponectin \\\n","0 48 23.500000 70 2.707 0.467409 8.8071 9.702400 \n","1 83 20.690495 92 3.115 0.706897 8.8438 5.429285 \n","2 82 23.124670 91 4.498 1.009651 17.9393 22.432040 \n","3 68 21.367521 77 3.226 0.612725 9.8827 7.169560 \n","4 86 21.111111 92 3.549 0.805386 6.6994 4.819240 \n",".. ... ... ... ... ... ... ... \n","111 45 26.850000 92 3.330 0.755688 54.6800 12.100000 \n","112 62 26.840000 100 4.530 1.117400 12.4500 21.420000 \n","113 65 32.050000 97 5.730 1.370998 61.4800 22.540000 \n","114 72 25.590000 82 2.820 0.570392 24.9600 33.750000 \n","115 86 27.180000 138 19.910 6.777364 90.2800 14.110000 \n","\n"," Resistin MCP.1 Classification \n","0 7.99585 417.114 1 \n","1 4.06405 468.786 1 \n","2 9.27715 554.697 1 \n","3 12.76600 928.220 1 \n","4 10.57635 773.920 1 \n",".. ... ... ... \n","111 10.96000 268.230 2 \n","112 7.32000 330.160 2 \n","113 10.33000 314.050 2 \n","114 3.27000 392.460 2 \n","115 4.35000 90.090 2 \n","\n","[116 rows x 10 columns]"],"text/html":["\n","
\n"," | Age | \n","BMI | \n","Glucose | \n","Insulin | \n","HOMA | \n","Leptin | \n","Adiponectin | \n","Resistin | \n","MCP.1 | \n","Classification | \n","
---|---|---|---|---|---|---|---|---|---|---|
0 | \n","48 | \n","23.500000 | \n","70 | \n","2.707 | \n","0.467409 | \n","8.8071 | \n","9.702400 | \n","7.99585 | \n","417.114 | \n","1 | \n","
1 | \n","83 | \n","20.690495 | \n","92 | \n","3.115 | \n","0.706897 | \n","8.8438 | \n","5.429285 | \n","4.06405 | \n","468.786 | \n","1 | \n","
2 | \n","82 | \n","23.124670 | \n","91 | \n","4.498 | \n","1.009651 | \n","17.9393 | \n","22.432040 | \n","9.27715 | \n","554.697 | \n","1 | \n","
3 | \n","68 | \n","21.367521 | \n","77 | \n","3.226 | \n","0.612725 | \n","9.8827 | \n","7.169560 | \n","12.76600 | \n","928.220 | \n","1 | \n","
4 | \n","86 | \n","21.111111 | \n","92 | \n","3.549 | \n","0.805386 | \n","6.6994 | \n","4.819240 | \n","10.57635 | \n","773.920 | \n","1 | \n","
... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","
111 | \n","45 | \n","26.850000 | \n","92 | \n","3.330 | \n","0.755688 | \n","54.6800 | \n","12.100000 | \n","10.96000 | \n","268.230 | \n","2 | \n","
112 | \n","62 | \n","26.840000 | \n","100 | \n","4.530 | \n","1.117400 | \n","12.4500 | \n","21.420000 | \n","7.32000 | \n","330.160 | \n","2 | \n","
113 | \n","65 | \n","32.050000 | \n","97 | \n","5.730 | \n","1.370998 | \n","61.4800 | \n","22.540000 | \n","10.33000 | \n","314.050 | \n","2 | \n","
114 | \n","72 | \n","25.590000 | \n","82 | \n","2.820 | \n","0.570392 | \n","24.9600 | \n","33.750000 | \n","3.27000 | \n","392.460 | \n","2 | \n","
115 | \n","86 | \n","27.180000 | \n","138 | \n","19.910 | \n","6.777364 | \n","90.2800 | \n","14.110000 | \n","4.35000 | \n","90.090 | \n","2 | \n","
116 rows × 10 columns
\n","\n"," | Age | \n","BMI | \n","Glucose | \n","Insulin | \n","HOMA | \n","Leptin | \n","Adiponectin | \n","Resistin | \n","MCP.1 | \n","Classification | \n","
---|---|---|---|---|---|---|---|---|---|---|
0 | \n","48 | \n","23.500000 | \n","70 | \n","2.707 | \n","0.467409 | \n","8.8071 | \n","9.702400 | \n","7.99585 | \n","417.114 | \n","Healthy controls | \n","
1 | \n","83 | \n","20.690495 | \n","92 | \n","3.115 | \n","0.706897 | \n","8.8438 | \n","5.429285 | \n","4.06405 | \n","468.786 | \n","Healthy controls | \n","
2 | \n","82 | \n","23.124670 | \n","91 | \n","4.498 | \n","1.009651 | \n","17.9393 | \n","22.432040 | \n","9.27715 | \n","554.697 | \n","Healthy controls | \n","
3 | \n","68 | \n","21.367521 | \n","77 | \n","3.226 | \n","0.612725 | \n","9.8827 | \n","7.169560 | \n","12.76600 | \n","928.220 | \n","Healthy controls | \n","
4 | \n","86 | \n","21.111111 | \n","92 | \n","3.549 | \n","0.805386 | \n","6.6994 | \n","4.819240 | \n","10.57635 | \n","773.920 | \n","Healthy controls | \n","
... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","
111 | \n","45 | \n","26.850000 | \n","92 | \n","3.330 | \n","0.755688 | \n","54.6800 | \n","12.100000 | \n","10.96000 | \n","268.230 | \n","Patients | \n","
112 | \n","62 | \n","26.840000 | \n","100 | \n","4.530 | \n","1.117400 | \n","12.4500 | \n","21.420000 | \n","7.32000 | \n","330.160 | \n","Patients | \n","
113 | \n","65 | \n","32.050000 | \n","97 | \n","5.730 | \n","1.370998 | \n","61.4800 | \n","22.540000 | \n","10.33000 | \n","314.050 | \n","Patients | \n","
114 | \n","72 | \n","25.590000 | \n","82 | \n","2.820 | \n","0.570392 | \n","24.9600 | \n","33.750000 | \n","3.27000 | \n","392.460 | \n","Patients | \n","
115 | \n","86 | \n","27.180000 | \n","138 | \n","19.910 | \n","6.777364 | \n","90.2800 | \n","14.110000 | \n","4.35000 | \n","90.090 | \n","Patients | \n","
116 rows × 10 columns
\n","\n"," | Age | \n","BMI | \n","Glucose | \n","Insulin | \n","HOMA | \n","Leptin | \n","Adiponectin | \n","Resistin | \n","MCP.1 | \n","
---|---|---|---|---|---|---|---|---|---|
0 | \n","48 | \n","23.500000 | \n","70 | \n","2.707 | \n","0.467409 | \n","8.8071 | \n","9.702400 | \n","7.99585 | \n","417.114 | \n","
1 | \n","83 | \n","20.690495 | \n","92 | \n","3.115 | \n","0.706897 | \n","8.8438 | \n","5.429285 | \n","4.06405 | \n","468.786 | \n","
2 | \n","82 | \n","23.124670 | \n","91 | \n","4.498 | \n","1.009651 | \n","17.9393 | \n","22.432040 | \n","9.27715 | \n","554.697 | \n","
3 | \n","68 | \n","21.367521 | \n","77 | \n","3.226 | \n","0.612725 | \n","9.8827 | \n","7.169560 | \n","12.76600 | \n","928.220 | \n","
4 | \n","86 | \n","21.111111 | \n","92 | \n","3.549 | \n","0.805386 | \n","6.6994 | \n","4.819240 | \n","10.57635 | \n","773.920 | \n","
\n"," | Age | \n","BMI | \n","Glucose | \n","Insulin | \n","HOMA | \n","Leptin | \n","Adiponectin | \n","Resistin | \n","MCP.1 | \n","Classification | \n","
---|---|---|---|---|---|---|---|---|---|---|
0 | \n","48 | \n","23.500000 | \n","70 | \n","2.707 | \n","0.467409 | \n","8.8071 | \n","9.702400 | \n","7.99585 | \n","417.114 | \n","1 | \n","
1 | \n","83 | \n","20.690495 | \n","92 | \n","3.115 | \n","0.706897 | \n","8.8438 | \n","5.429285 | \n","4.06405 | \n","468.786 | \n","1 | \n","
2 | \n","82 | \n","23.124670 | \n","91 | \n","4.498 | \n","1.009651 | \n","17.9393 | \n","22.432040 | \n","9.27715 | \n","554.697 | \n","1 | \n","
3 | \n","68 | \n","21.367521 | \n","77 | \n","3.226 | \n","0.612725 | \n","9.8827 | \n","7.169560 | \n","12.76600 | \n","928.220 | \n","1 | \n","
4 | \n","86 | \n","21.111111 | \n","92 | \n","3.549 | \n","0.805386 | \n","6.6994 | \n","4.819240 | \n","10.57635 | \n","773.920 | \n","1 | \n","
... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","... | \n","
111 | \n","45 | \n","26.850000 | \n","92 | \n","3.330 | \n","0.755688 | \n","54.6800 | \n","12.100000 | \n","10.96000 | \n","268.230 | \n","2 | \n","
112 | \n","62 | \n","26.840000 | \n","100 | \n","4.530 | \n","1.117400 | \n","12.4500 | \n","21.420000 | \n","7.32000 | \n","330.160 | \n","2 | \n","
113 | \n","65 | \n","32.050000 | \n","97 | \n","5.730 | \n","1.370998 | \n","61.4800 | \n","22.540000 | \n","10.33000 | \n","314.050 | \n","2 | \n","
114 | \n","72 | \n","25.590000 | \n","82 | \n","2.820 | \n","0.570392 | \n","24.9600 | \n","33.750000 | \n","3.27000 | \n","392.460 | \n","2 | \n","
115 | \n","86 | \n","27.180000 | \n","138 | \n","19.910 | \n","6.777364 | \n","90.2800 | \n","14.110000 | \n","4.35000 | \n","90.090 | \n","2 | \n","
116 rows × 10 columns
\n","