From 13a8a7ddcd1c8129370559c0418d1d36276d7d71 Mon Sep 17 00:00:00 2001
From: Arindam Sahoo <88739246+arindam-sahoo@users.noreply.github.com>
Date: Mon, 24 Jun 2024 14:06:38 +0530
Subject: [PATCH] Add files via upload

---
 breast-cancer-detection-using-various-algorithms.ipynb | 1 +
 1 file changed, 1 insertion(+)
 create mode 100644 breast-cancer-detection-using-various-algorithms.ipynb

diff --git a/breast-cancer-detection-using-various-algorithms.ipynb b/breast-cancer-detection-using-various-algorithms.ipynb
new file mode 100644
index 0000000..a0b0db9
--- /dev/null
+++ b/breast-cancer-detection-using-various-algorithms.ipynb
@@ -0,0 +1 @@
+{"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.10.13","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"none","dataSources":[{"sourceId":2984728,"sourceType":"datasetVersion","datasetId":1829286}],"dockerImageVersionId":30732,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":false}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"code","source":"# This Python 3 environment comes with many helpful analytics libraries installed\n# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python\n# For example, here are several helpful packages to load\n\nimport numpy as np # linear algebra\nimport pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)\nimport sklearn.datasets","metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","execution":{"iopub.status.busy":"2024-06-24T08:32:29.769529Z","iopub.execute_input":"2024-06-24T08:32:29.770856Z","iopub.status.idle":"2024-06-24T08:32:29.777355Z","shell.execute_reply.started":"2024-06-24T08:32:29.770763Z","shell.execute_reply":"2024-06-24T08:32:29.776088Z"},"trusted":true},"execution_count":84,"outputs":[]},{"cell_type":"markdown","source":"**Loading the dataset into a pandas DataFrame**","metadata":{}},{"cell_type":"code","source":"breast_cancer = 
sklearn.datasets.load_breast_cancer()","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.779501Z","iopub.execute_input":"2024-06-24T08:32:29.779951Z","iopub.status.idle":"2024-06-24T08:32:29.801645Z","shell.execute_reply.started":"2024-06-24T08:32:29.779911Z","shell.execute_reply":"2024-06-24T08:32:29.800338Z"},"trusted":true},"execution_count":85,"outputs":[]},{"cell_type":"code","source":"breast_cancer","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.803388Z","iopub.execute_input":"2024-06-24T08:32:29.804481Z","iopub.status.idle":"2024-06-24T08:32:29.815681Z","shell.execute_reply.started":"2024-06-24T08:32:29.804443Z","shell.execute_reply":"2024-06-24T08:32:29.814392Z"},"trusted":true},"execution_count":86,"outputs":[{"execution_count":86,"output_type":"execute_result","data":{"text/plain":"{'data': array([[1.799e+01, 1.038e+01, 1.228e+02, ..., 2.654e-01, 4.601e-01,\n         1.189e-01],\n        [2.057e+01, 1.777e+01, 1.329e+02, ..., 1.860e-01, 2.750e-01,\n         8.902e-02],\n        [1.969e+01, 2.125e+01, 1.300e+02, ..., 2.430e-01, 3.613e-01,\n         8.758e-02],\n        ...,\n        [1.660e+01, 2.808e+01, 1.083e+02, ..., 1.418e-01, 2.218e-01,\n         7.820e-02],\n        [2.060e+01, 2.933e+01, 1.401e+02, ..., 2.650e-01, 4.087e-01,\n         1.240e-01],\n        [7.760e+00, 2.454e+01, 4.792e+01, ..., 0.000e+00, 2.871e-01,\n         7.039e-02]]),\n 'target': array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1,\n        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0,\n        0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0,\n        1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0,\n        1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1,\n        1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0,\n        0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1,\n        1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 
0, 1, 1, 0, 0, 1, 1, 1,\n        1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0,\n        0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0,\n        1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1,\n        1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n        0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1,\n        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1,\n        1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0,\n        0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0,\n        0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0,\n        1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1,\n        1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0,\n        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1,\n        1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0,\n        1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1,\n        1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1,\n        1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1,\n        1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1]),\n 'frame': None,\n 'target_names': array(['malignant', 'benign'], dtype='<U9'),\n 'DESCR': '.. 
_breast_cancer_dataset:\\n\\nBreast cancer wisconsin (diagnostic) dataset\\n--------------------------------------------\\n\\n**Data Set Characteristics:**\\n\\n    :Number of Instances: 569\\n\\n    :Number of Attributes: 30 numeric, predictive attributes and the class\\n\\n    :Attribute Information:\\n        - radius (mean of distances from center to points on the perimeter)\\n        - texture (standard deviation of gray-scale values)\\n        - perimeter\\n        - area\\n        - smoothness (local variation in radius lengths)\\n        - compactness (perimeter^2 / area - 1.0)\\n        - concavity (severity of concave portions of the contour)\\n        - concave points (number of concave portions of the contour)\\n        - symmetry\\n        - fractal dimension (\"coastline approximation\" - 1)\\n\\n        The mean, standard error, and \"worst\" or largest (mean of the three\\n        worst/largest values) of these features were computed for each image,\\n        resulting in 30 features.  
For instance, field 0 is Mean Radius, field\\n        10 is Radius SE, field 20 is Worst Radius.\\n\\n        - class:\\n                - WDBC-Malignant\\n                - WDBC-Benign\\n\\n    :Summary Statistics:\\n\\n    ===================================== ====== ======\\n                                           Min    Max\\n    ===================================== ====== ======\\n    radius (mean):                        6.981  28.11\\n    texture (mean):                       9.71   39.28\\n    perimeter (mean):                     43.79  188.5\\n    area (mean):                          143.5  2501.0\\n    smoothness (mean):                    0.053  0.163\\n    compactness (mean):                   0.019  0.345\\n    concavity (mean):                     0.0    0.427\\n    concave points (mean):                0.0    0.201\\n    symmetry (mean):                      0.106  0.304\\n    fractal dimension (mean):             0.05   0.097\\n    radius (standard error):              0.112  2.873\\n    texture (standard error):             0.36   4.885\\n    perimeter (standard error):           0.757  21.98\\n    area (standard error):                6.802  542.2\\n    smoothness (standard error):          0.002  0.031\\n    compactness (standard error):         0.002  0.135\\n    concavity (standard error):           0.0    0.396\\n    concave points (standard error):      0.0    0.053\\n    symmetry (standard error):            0.008  0.079\\n    fractal dimension (standard error):   0.001  0.03\\n    radius (worst):                       7.93   36.04\\n    texture (worst):                      12.02  49.54\\n    perimeter (worst):                    50.41  251.2\\n    area (worst):                         185.2  4254.0\\n    smoothness (worst):                   0.071  0.223\\n    compactness (worst):                  0.027  1.058\\n    concavity (worst):                    0.0    1.252\\n    concave points (worst):               0.0    0.291\\n    
symmetry (worst):                     0.156  0.664\\n    fractal dimension (worst):            0.055  0.208\\n    ===================================== ====== ======\\n\\n    :Missing Attribute Values: None\\n\\n    :Class Distribution: 212 - Malignant, 357 - Benign\\n\\n    :Creator:  Dr. William H. Wolberg, W. Nick Street, Olvi L. Mangasarian\\n\\n    :Donor: Nick Street\\n\\n    :Date: November, 1995\\n\\nThis is a copy of UCI ML Breast Cancer Wisconsin (Diagnostic) datasets.\\nhttps://goo.gl/U2Uwz2\\n\\nFeatures are computed from a digitized image of a fine needle\\naspirate (FNA) of a breast mass.  They describe\\ncharacteristics of the cell nuclei present in the image.\\n\\nSeparating plane described above was obtained using\\nMultisurface Method-Tree (MSM-T) [K. P. Bennett, \"Decision Tree\\nConstruction Via Linear Programming.\" Proceedings of the 4th\\nMidwest Artificial Intelligence and Cognitive Science Society,\\npp. 97-101, 1992], a classification method which uses linear\\nprogramming to construct a decision tree.  Relevant features\\nwere selected using an exhaustive search in the space of 1-4\\nfeatures and 1-3 separating planes.\\n\\nThe actual linear program used to obtain the separating plane\\nin the 3-dimensional space is that described in:\\n[K. P. Bennett and O. L. Mangasarian: \"Robust Linear\\nProgramming Discrimination of Two Linearly Inseparable Sets\",\\nOptimization Methods and Software 1, 1992, 23-34].\\n\\nThis database is also available through the UW CS ftp server:\\n\\nftp ftp.cs.wisc.edu\\ncd math-prog/cpo-dataset/machine-learn/WDBC/\\n\\n.. topic:: References\\n\\n   - W.N. Street, W.H. Wolberg and O.L. Mangasarian. Nuclear feature extraction \\n     for breast tumor diagnosis. IS&T/SPIE 1993 International Symposium on \\n     Electronic Imaging: Science and Technology, volume 1905, pages 861-870,\\n     San Jose, CA, 1993.\\n   - O.L. Mangasarian, W.N. Street and W.H. Wolberg. 
Breast cancer diagnosis and \\n     prognosis via linear programming. Operations Research, 43(4), pages 570-577, \\n     July-August 1995.\\n   - W.H. Wolberg, W.N. Street, and O.L. Mangasarian. Machine learning techniques\\n     to diagnose breast cancer from fine-needle aspirates. Cancer Letters 77 (1994) \\n     163-171.',\n 'feature_names': array(['mean radius', 'mean texture', 'mean perimeter', 'mean area',\n        'mean smoothness', 'mean compactness', 'mean concavity',\n        'mean concave points', 'mean symmetry', 'mean fractal dimension',\n        'radius error', 'texture error', 'perimeter error', 'area error',\n        'smoothness error', 'compactness error', 'concavity error',\n        'concave points error', 'symmetry error',\n        'fractal dimension error', 'worst radius', 'worst texture',\n        'worst perimeter', 'worst area', 'worst smoothness',\n        'worst compactness', 'worst concavity', 'worst concave points',\n        'worst symmetry', 'worst fractal dimension'], dtype='<U23'),\n 'filename': 'breast_cancer.csv',\n 'data_module': 'sklearn.datasets.data'}"},"metadata":{}}]},{"cell_type":"code","source":"X = breast_cancer.data\nY = 
breast_cancer.target","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.817418Z","iopub.execute_input":"2024-06-24T08:32:29.818334Z","iopub.status.idle":"2024-06-24T08:32:29.830358Z","shell.execute_reply.started":"2024-06-24T08:32:29.818285Z","shell.execute_reply":"2024-06-24T08:32:29.829100Z"},"trusted":true},"execution_count":87,"outputs":[]},{"cell_type":"code","source":"X","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.833277Z","iopub.execute_input":"2024-06-24T08:32:29.834202Z","iopub.status.idle":"2024-06-24T08:32:29.844110Z","shell.execute_reply.started":"2024-06-24T08:32:29.834153Z","shell.execute_reply":"2024-06-24T08:32:29.842765Z"},"trusted":true},"execution_count":88,"outputs":[{"execution_count":88,"output_type":"execute_result","data":{"text/plain":"array([[1.799e+01, 1.038e+01, 1.228e+02, ..., 2.654e-01, 4.601e-01,\n        1.189e-01],\n       [2.057e+01, 1.777e+01, 1.329e+02, ..., 1.860e-01, 2.750e-01,\n        8.902e-02],\n       [1.969e+01, 2.125e+01, 1.300e+02, ..., 2.430e-01, 3.613e-01,\n        8.758e-02],\n       ...,\n       [1.660e+01, 2.808e+01, 1.083e+02, ..., 1.418e-01, 2.218e-01,\n        7.820e-02],\n       [2.060e+01, 2.933e+01, 1.401e+02, ..., 2.650e-01, 4.087e-01,\n        1.240e-01],\n       [7.760e+00, 2.454e+01, 4.792e+01, ..., 0.000e+00, 2.871e-01,\n        7.039e-02]])"},"metadata":{}}]},{"cell_type":"code","source":"Y","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.845470Z","iopub.execute_input":"2024-06-24T08:32:29.846142Z","iopub.status.idle":"2024-06-24T08:32:29.855383Z","shell.execute_reply.started":"2024-06-24T08:32:29.846109Z","shell.execute_reply":"2024-06-24T08:32:29.854255Z"},"trusted":true},"execution_count":89,"outputs":[{"execution_count":89,"output_type":"execute_result","data":{"text/plain":"array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1,\n       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0,\n       0, 0, 1, 0, 1, 1, 
1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0,\n       1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0,\n       1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1,\n       1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0,\n       0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1,\n       1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1,\n       1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0,\n       0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0,\n       1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1,\n       1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n       0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1,\n       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1,\n       1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0,\n       0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0,\n       0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0,\n       1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1,\n       1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0,\n       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1,\n       1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0,\n       1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1,\n       1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1,\n       1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1,\n       1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1])"},"metadata":{}}]},{"cell_type":"code","source":"print(X.shape, 
Y.shape)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.857114Z","iopub.execute_input":"2024-06-24T08:32:29.857661Z","iopub.status.idle":"2024-06-24T08:32:29.866377Z","shell.execute_reply.started":"2024-06-24T08:32:29.857616Z","shell.execute_reply":"2024-06-24T08:32:29.865091Z"},"trusted":true},"execution_count":90,"outputs":[{"name":"stdout","text":"(569, 30) (569,)\n","output_type":"stream"}]},{"cell_type":"code","source":"df = pd.DataFrame(breast_cancer.data, columns = breast_cancer.feature_names)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.868337Z","iopub.execute_input":"2024-06-24T08:32:29.869142Z","iopub.status.idle":"2024-06-24T08:32:29.877855Z","shell.execute_reply.started":"2024-06-24T08:32:29.869095Z","shell.execute_reply":"2024-06-24T08:32:29.876520Z"},"trusted":true},"execution_count":91,"outputs":[]},{"cell_type":"code","source":"df['class'] =  breast_cancer.target","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.880300Z","iopub.execute_input":"2024-06-24T08:32:29.880727Z","iopub.status.idle":"2024-06-24T08:32:29.889898Z","shell.execute_reply.started":"2024-06-24T08:32:29.880686Z","shell.execute_reply":"2024-06-24T08:32:29.888549Z"},"trusted":true},"execution_count":92,"outputs":[]},{"cell_type":"code","source":"df","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.891537Z","iopub.execute_input":"2024-06-24T08:32:29.892284Z","iopub.status.idle":"2024-06-24T08:32:29.932736Z","shell.execute_reply.started":"2024-06-24T08:32:29.892235Z","shell.execute_reply":"2024-06-24T08:32:29.931399Z"},"trusted":true},"execution_count":93,"outputs":[{"execution_count":93,"output_type":"execute_result","data":{"text/plain":"     mean radius  mean texture  mean perimeter  mean area  mean smoothness  \\\n0          17.99         10.38          122.80     1001.0          0.11840   \n1          20.57         17.77          132.90     1326.0          0.08474   \n2          19.69         21.25         
 130.00     1203.0          0.10960   \n3          11.42         20.38           77.58      386.1          0.14250   \n4          20.29         14.34          135.10     1297.0          0.10030   \n..           ...           ...             ...        ...              ...   \n564        21.56         22.39          142.00     1479.0          0.11100   \n565        20.13         28.25          131.20     1261.0          0.09780   \n566        16.60         28.08          108.30      858.1          0.08455   \n567        20.60         29.33          140.10     1265.0          0.11780   \n568         7.76         24.54           47.92      181.0          0.05263   \n\n     mean compactness  mean concavity  mean concave points  mean symmetry  \\\n0             0.27760         0.30010              0.14710         0.2419   \n1             0.07864         0.08690              0.07017         0.1812   \n2             0.15990         0.19740              0.12790         0.2069   \n3             0.28390         0.24140              0.10520         0.2597   \n4             0.13280         0.19800              0.10430         0.1809   \n..                ...             ...                  ...            ...   \n564           0.11590         0.24390              0.13890         0.1726   \n565           0.10340         0.14400              0.09791         0.1752   \n566           0.10230         0.09251              0.05302         0.1590   \n567           0.27700         0.35140              0.15200         0.2397   \n568           0.04362         0.00000              0.00000         0.1587   \n\n     mean fractal dimension  ...  worst texture  worst perimeter  worst area  \\\n0                   0.07871  ...          17.33           184.60      2019.0   \n1                   0.05667  ...          23.41           158.80      1956.0   \n2                   0.05999  ...          25.53           152.50      1709.0   \n3                   0.09744  ...          
26.50            98.87       567.7   \n4                   0.05883  ...          16.67           152.20      1575.0   \n..                      ...  ...            ...              ...         ...   \n564                 0.05623  ...          26.40           166.10      2027.0   \n565                 0.05533  ...          38.25           155.00      1731.0   \n566                 0.05648  ...          34.12           126.70      1124.0   \n567                 0.07016  ...          39.42           184.60      1821.0   \n568                 0.05884  ...          30.37            59.16       268.6   \n\n     worst smoothness  worst compactness  worst concavity  \\\n0             0.16220            0.66560           0.7119   \n1             0.12380            0.18660           0.2416   \n2             0.14440            0.42450           0.4504   \n3             0.20980            0.86630           0.6869   \n4             0.13740            0.20500           0.4000   \n..                ...                ...              ...   \n564           0.14100            0.21130           0.4107   \n565           0.11660            0.19220           0.3215   \n566           0.11390            0.30940           0.3403   \n567           0.16500            0.86810           0.9387   \n568           0.08996            0.06444           0.0000   \n\n     worst concave points  worst symmetry  worst fractal dimension  class  \n0                  0.2654          0.4601                  0.11890      0  \n1                  0.1860          0.2750                  0.08902      0  \n2                  0.2430          0.3613                  0.08758      0  \n3                  0.2575          0.6638                  0.17300      0  \n4                  0.1625          0.2364                  0.07678      0  \n..                    ...             ...                      ...    ...  
\n564                0.2216          0.2060                  0.07115      0  \n565                0.1628          0.2572                  0.06637      0  \n566                0.1418          0.2218                  0.07820      0  \n567                0.2650          0.4087                  0.12400      0  \n568                0.0000          0.2871                  0.07039      1  \n\n[569 rows x 31 columns]","text/html":"<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>mean radius</th>\n      <th>mean texture</th>\n      <th>mean perimeter</th>\n      <th>mean area</th>\n      <th>mean smoothness</th>\n      <th>mean compactness</th>\n      <th>mean concavity</th>\n      <th>mean concave points</th>\n      <th>mean symmetry</th>\n      <th>mean fractal dimension</th>\n      <th>...</th>\n      <th>worst texture</th>\n      <th>worst perimeter</th>\n      <th>worst area</th>\n      <th>worst smoothness</th>\n      <th>worst compactness</th>\n      <th>worst concavity</th>\n      <th>worst concave points</th>\n      <th>worst symmetry</th>\n      <th>worst fractal dimension</th>\n      <th>class</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>17.99</td>\n      <td>10.38</td>\n      <td>122.80</td>\n      <td>1001.0</td>\n      <td>0.11840</td>\n      <td>0.27760</td>\n      <td>0.30010</td>\n      <td>0.14710</td>\n      <td>0.2419</td>\n      <td>0.07871</td>\n      <td>...</td>\n      <td>17.33</td>\n      <td>184.60</td>\n      <td>2019.0</td>\n      <td>0.16220</td>\n      <td>0.66560</td>\n      <td>0.7119</td>\n      <td>0.2654</td>\n      <td>0.4601</td>\n      <td>0.11890</td>\n      <td>0</td>\n    </tr>\n    
<tr>\n      <th>1</th>\n      <td>20.57</td>\n      <td>17.77</td>\n      <td>132.90</td>\n      <td>1326.0</td>\n      <td>0.08474</td>\n      <td>0.07864</td>\n      <td>0.08690</td>\n      <td>0.07017</td>\n      <td>0.1812</td>\n      <td>0.05667</td>\n      <td>...</td>\n      <td>23.41</td>\n      <td>158.80</td>\n      <td>1956.0</td>\n      <td>0.12380</td>\n      <td>0.18660</td>\n      <td>0.2416</td>\n      <td>0.1860</td>\n      <td>0.2750</td>\n      <td>0.08902</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>2</th>\n      <td>19.69</td>\n      <td>21.25</td>\n      <td>130.00</td>\n      <td>1203.0</td>\n      <td>0.10960</td>\n      <td>0.15990</td>\n      <td>0.19740</td>\n      <td>0.12790</td>\n      <td>0.2069</td>\n      <td>0.05999</td>\n      <td>...</td>\n      <td>25.53</td>\n      <td>152.50</td>\n      <td>1709.0</td>\n      <td>0.14440</td>\n      <td>0.42450</td>\n      <td>0.4504</td>\n      <td>0.2430</td>\n      <td>0.3613</td>\n      <td>0.08758</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>3</th>\n      <td>11.42</td>\n      <td>20.38</td>\n      <td>77.58</td>\n      <td>386.1</td>\n      <td>0.14250</td>\n      <td>0.28390</td>\n      <td>0.24140</td>\n      <td>0.10520</td>\n      <td>0.2597</td>\n      <td>0.09744</td>\n      <td>...</td>\n      <td>26.50</td>\n      <td>98.87</td>\n      <td>567.7</td>\n      <td>0.20980</td>\n      <td>0.86630</td>\n      <td>0.6869</td>\n      <td>0.2575</td>\n      <td>0.6638</td>\n      <td>0.17300</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>4</th>\n      <td>20.29</td>\n      <td>14.34</td>\n      <td>135.10</td>\n      <td>1297.0</td>\n      <td>0.10030</td>\n      <td>0.13280</td>\n      <td>0.19800</td>\n      <td>0.10430</td>\n      <td>0.1809</td>\n      <td>0.05883</td>\n      <td>...</td>\n      <td>16.67</td>\n      <td>152.20</td>\n      <td>1575.0</td>\n      <td>0.13740</td>\n      <td>0.20500</td>\n      <td>0.4000</td>\n      <td>0.1625</td>\n      
<td>0.2364</td>\n      <td>0.07678</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>...</th>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n    </tr>\n    <tr>\n      <th>564</th>\n      <td>21.56</td>\n      <td>22.39</td>\n      <td>142.00</td>\n      <td>1479.0</td>\n      <td>0.11100</td>\n      <td>0.11590</td>\n      <td>0.24390</td>\n      <td>0.13890</td>\n      <td>0.1726</td>\n      <td>0.05623</td>\n      <td>...</td>\n      <td>26.40</td>\n      <td>166.10</td>\n      <td>2027.0</td>\n      <td>0.14100</td>\n      <td>0.21130</td>\n      <td>0.4107</td>\n      <td>0.2216</td>\n      <td>0.2060</td>\n      <td>0.07115</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>565</th>\n      <td>20.13</td>\n      <td>28.25</td>\n      <td>131.20</td>\n      <td>1261.0</td>\n      <td>0.09780</td>\n      <td>0.10340</td>\n      <td>0.14400</td>\n      <td>0.09791</td>\n      <td>0.1752</td>\n      <td>0.05533</td>\n      <td>...</td>\n      <td>38.25</td>\n      <td>155.00</td>\n      <td>1731.0</td>\n      <td>0.11660</td>\n      <td>0.19220</td>\n      <td>0.3215</td>\n      <td>0.1628</td>\n      <td>0.2572</td>\n      <td>0.06637</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>566</th>\n      <td>16.60</td>\n      <td>28.08</td>\n      <td>108.30</td>\n      <td>858.1</td>\n      <td>0.08455</td>\n      <td>0.10230</td>\n      <td>0.09251</td>\n      <td>0.05302</td>\n      <td>0.1590</td>\n      <td>0.05648</td>\n      <td>...</td>\n      <td>34.12</td>\n      <td>126.70</td>\n      <td>1124.0</td>\n      <td>0.11390</td>\n      <td>0.30940</td>\n      <td>0.3403</td>\n      
<td>0.1418</td>\n      <td>0.2218</td>\n      <td>0.07820</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>567</th>\n      <td>20.60</td>\n      <td>29.33</td>\n      <td>140.10</td>\n      <td>1265.0</td>\n      <td>0.11780</td>\n      <td>0.27700</td>\n      <td>0.35140</td>\n      <td>0.15200</td>\n      <td>0.2397</td>\n      <td>0.07016</td>\n      <td>...</td>\n      <td>39.42</td>\n      <td>184.60</td>\n      <td>1821.0</td>\n      <td>0.16500</td>\n      <td>0.86810</td>\n      <td>0.9387</td>\n      <td>0.2650</td>\n      <td>0.4087</td>\n      <td>0.12400</td>\n      <td>0</td>\n    </tr>\n    <tr>\n      <th>568</th>\n      <td>7.76</td>\n      <td>24.54</td>\n      <td>47.92</td>\n      <td>181.0</td>\n      <td>0.05263</td>\n      <td>0.04362</td>\n      <td>0.00000</td>\n      <td>0.00000</td>\n      <td>0.1587</td>\n      <td>0.05884</td>\n      <td>...</td>\n      <td>30.37</td>\n      <td>59.16</td>\n      <td>268.6</td>\n      <td>0.08996</td>\n      <td>0.06444</td>\n      <td>0.0000</td>\n      <td>0.0000</td>\n      <td>0.2871</td>\n      <td>0.07039</td>\n      <td>1</td>\n    </tr>\n  </tbody>\n</table>\n<p>569 rows × 31 columns</p>\n</div>"},"metadata":{}}]},{"cell_type":"code","source":"print(breast_cancer.target_names)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.934362Z","iopub.execute_input":"2024-06-24T08:32:29.934862Z","iopub.status.idle":"2024-06-24T08:32:29.943888Z","shell.execute_reply.started":"2024-06-24T08:32:29.934819Z","shell.execute_reply":"2024-06-24T08:32:29.942488Z"},"trusted":true},"execution_count":94,"outputs":[{"name":"stdout","text":"['malignant' 'benign']\n","output_type":"stream"}]},{"cell_type":"code","source":"df.groupby('class').mean()\n#0 = malignant\n#1 = 
benign","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.945523Z","iopub.execute_input":"2024-06-24T08:32:29.946053Z","iopub.status.idle":"2024-06-24T08:32:29.977139Z","shell.execute_reply.started":"2024-06-24T08:32:29.946009Z","shell.execute_reply":"2024-06-24T08:32:29.975901Z"},"trusted":true},"execution_count":95,"outputs":[{"execution_count":95,"output_type":"execute_result","data":{"text/plain":"       mean radius  mean texture  mean perimeter   mean area  mean smoothness  \\\nclass                                                                           \n0        17.462830     21.604906      115.365377  978.376415         0.102898   \n1        12.146524     17.914762       78.075406  462.790196         0.092478   \n\n       mean compactness  mean concavity  mean concave points  mean symmetry  \\\nclass                                                                         \n0              0.145188        0.160775             0.087990       0.192909   \n1              0.080085        0.046058             0.025717       0.174186   \n\n       mean fractal dimension  ...  worst radius  worst texture  \\\nclass                          ...                                \n0                    0.062680  ...     21.134811      29.318208   \n1                    0.062867  ...     
13.379801      23.515070   \n\n       worst perimeter   worst area  worst smoothness  worst compactness  \\\nclass                                                                      \n0           141.370330  1422.286321          0.144845           0.374824   \n1            87.005938   558.899440          0.124959           0.182673   \n\n       worst concavity  worst concave points  worst symmetry  \\\nclass                                                          \n0             0.450606              0.182237        0.323468   \n1             0.166238              0.074444        0.270246   \n\n       worst fractal dimension  \nclass                           \n0                     0.091530  \n1                     0.079442  \n\n[2 rows x 30 columns]","text/html":"<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>mean radius</th>\n      <th>mean texture</th>\n      <th>mean perimeter</th>\n      <th>mean area</th>\n      <th>mean smoothness</th>\n      <th>mean compactness</th>\n      <th>mean concavity</th>\n      <th>mean concave points</th>\n      <th>mean symmetry</th>\n      <th>mean fractal dimension</th>\n      <th>...</th>\n      <th>worst radius</th>\n      <th>worst texture</th>\n      <th>worst perimeter</th>\n      <th>worst area</th>\n      <th>worst smoothness</th>\n      <th>worst compactness</th>\n      <th>worst concavity</th>\n      <th>worst concave points</th>\n      <th>worst symmetry</th>\n      <th>worst fractal dimension</th>\n    </tr>\n    <tr>\n      <th>class</th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      
<th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n      <th></th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>17.462830</td>\n      <td>21.604906</td>\n      <td>115.365377</td>\n      <td>978.376415</td>\n      <td>0.102898</td>\n      <td>0.145188</td>\n      <td>0.160775</td>\n      <td>0.087990</td>\n      <td>0.192909</td>\n      <td>0.062680</td>\n      <td>...</td>\n      <td>21.134811</td>\n      <td>29.318208</td>\n      <td>141.370330</td>\n      <td>1422.286321</td>\n      <td>0.144845</td>\n      <td>0.374824</td>\n      <td>0.450606</td>\n      <td>0.182237</td>\n      <td>0.323468</td>\n      <td>0.091530</td>\n    </tr>\n    <tr>\n      <th>1</th>\n      <td>12.146524</td>\n      <td>17.914762</td>\n      <td>78.075406</td>\n      <td>462.790196</td>\n      <td>0.092478</td>\n      <td>0.080085</td>\n      <td>0.046058</td>\n      <td>0.025717</td>\n      <td>0.174186</td>\n      <td>0.062867</td>\n      <td>...</td>\n      <td>13.379801</td>\n      <td>23.515070</td>\n      <td>87.005938</td>\n      <td>558.899440</td>\n      <td>0.124959</td>\n      <td>0.182673</td>\n      <td>0.166238</td>\n      <td>0.074444</td>\n      <td>0.270246</td>\n      <td>0.079442</td>\n    </tr>\n  </tbody>\n</table>\n<p>2 rows × 30 columns</p>\n</div>"},"metadata":{}}]},{"cell_type":"markdown","source":"**Train and Test Data Split**","metadata":{}},{"cell_type":"code","source":"from sklearn.model_selection import train_test_split\nX_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, stratify=Y, random_state=42)\n#stratify --> keeps the class proportions of Y the same in the train and test sets as in the original data\n#random_state --> specific split of data, each value of random_state splits the data 
differently","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.978542Z","iopub.execute_input":"2024-06-24T08:32:29.978958Z","iopub.status.idle":"2024-06-24T08:32:29.989465Z","shell.execute_reply.started":"2024-06-24T08:32:29.978919Z","shell.execute_reply":"2024-06-24T08:32:29.988222Z"},"trusted":true},"execution_count":96,"outputs":[]},{"cell_type":"code","source":"print(Y.shape, Y_train.shape, Y_test.shape)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:29.995241Z","iopub.execute_input":"2024-06-24T08:32:29.996307Z","iopub.status.idle":"2024-06-24T08:32:30.002447Z","shell.execute_reply.started":"2024-06-24T08:32:29.996255Z","shell.execute_reply":"2024-06-24T08:32:30.001250Z"},"trusted":true},"execution_count":97,"outputs":[{"name":"stdout","text":"(569,) (455,) (114,)\n","output_type":"stream"}]},{"cell_type":"code","source":"print(X_train.mean(), X_test.mean(), X.mean())","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.003703Z","iopub.execute_input":"2024-06-24T08:32:30.004058Z","iopub.status.idle":"2024-06-24T08:32:30.014110Z","shell.execute_reply.started":"2024-06-24T08:32:30.004029Z","shell.execute_reply":"2024-06-24T08:32:30.012490Z"},"trusted":true},"execution_count":98,"outputs":[{"name":"stdout","text":"61.21359590991941 64.59323844011696 61.890712339519624\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **Logistic Regression**","metadata":{}},{"cell_type":"code","source":"#import logistic regression from sklearn\nfrom sklearn.linear_model import LogisticRegression","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.015373Z","iopub.execute_input":"2024-06-24T08:32:30.015776Z","iopub.status.idle":"2024-06-24T08:32:30.029406Z","shell.execute_reply.started":"2024-06-24T08:32:30.015747Z","shell.execute_reply":"2024-06-24T08:32:30.027816Z"},"trusted":true},"execution_count":99,"outputs":[]},{"cell_type":"code","source":"classifier = 
LogisticRegression(max_iter=10000)  # default max_iter=100 is too low for lbfgs to converge on these unscaled features","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.030892Z","iopub.execute_input":"2024-06-24T08:32:30.033226Z","iopub.status.idle":"2024-06-24T08:32:30.041930Z","shell.execute_reply.started":"2024-06-24T08:32:30.033165Z","shell.execute_reply":"2024-06-24T08:32:30.040010Z"},"trusted":true},"execution_count":100,"outputs":[]},{"cell_type":"code","source":"#training the model on training data\nclassifier.fit(X_train, Y_train)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.044236Z","iopub.execute_input":"2024-06-24T08:32:30.044799Z","iopub.status.idle":"2024-06-24T08:32:30.121502Z","shell.execute_reply.started":"2024-06-24T08:32:30.044758Z","shell.execute_reply":"2024-06-24T08:32:30.120260Z"},"trusted":true},"execution_count":101,"outputs":[{"name":"stderr","text":"/opt/conda/lib/python3.10/site-packages/sklearn/linear_model/_logistic.py:458: ConvergenceWarning: lbfgs failed to converge (status=1):\nSTOP: TOTAL NO. of ITERATIONS REACHED LIMIT.\n\nIncrease the number of iterations (max_iter) or scale the data as shown in:\n    https://scikit-learn.org/stable/modules/preprocessing.html\nPlease also refer to the documentation for alternative solver options:\n    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression\n  n_iter_i = _check_optimize_result(\n","output_type":"stream"},{"execution_count":101,"output_type":"execute_result","data":{"text/plain":"LogisticRegression()","text/html":"<style>#sk-container-id-5 {color: black;background-color: white;}#sk-container-id-5 pre{padding: 0;}#sk-container-id-5 div.sk-toggleable {background-color: white;}#sk-container-id-5 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-5 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-5 
label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-5 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-5 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-5 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-5 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-5 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-5 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-5 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-5 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-5 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-5 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-5 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-5 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-5 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-5 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-5 div.sk-item {position: relative;z-index: 1;}#sk-container-id-5 
div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-5 div.sk-item::before, #sk-container-id-5 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-5 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-5 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-5 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-5 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-5 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-5 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-5 div.sk-label-container {text-align: center;}#sk-container-id-5 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-5 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-5\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>LogisticRegression()</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. 
<br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-5\" type=\"checkbox\" checked><label for=\"sk-estimator-id-5\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">LogisticRegression</label><div class=\"sk-toggleable__content\"><pre>LogisticRegression()</pre></div></div></div></div></div>"},"metadata":{}}]},{"cell_type":"code","source":"#import the evaluation metrics: accuracy_score, confusion_matrix, classification_report\nfrom sklearn.metrics import accuracy_score, confusion_matrix, classification_report","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.123112Z","iopub.execute_input":"2024-06-24T08:32:30.124346Z","iopub.status.idle":"2024-06-24T08:32:30.130323Z","shell.execute_reply.started":"2024-06-24T08:32:30.124304Z","shell.execute_reply":"2024-06-24T08:32:30.128660Z"},"trusted":true},"execution_count":102,"outputs":[]},{"cell_type":"code","source":"#prediction on test_data\nprediction = classifier.predict(X_test)\naccuracy = accuracy_score(Y_test, prediction)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.131984Z","iopub.execute_input":"2024-06-24T08:32:30.133174Z","iopub.status.idle":"2024-06-24T08:32:30.143408Z","shell.execute_reply.started":"2024-06-24T08:32:30.133120Z","shell.execute_reply":"2024-06-24T08:32:30.141487Z"},"trusted":true},"execution_count":103,"outputs":[]},{"cell_type":"code","source":"# Creating accuracy dictionary\naccuracy_dict = {}\naccuracy_dict['Logistic Regression'] = round((accuracy * 
100),2)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.145736Z","iopub.execute_input":"2024-06-24T08:32:30.147438Z","iopub.status.idle":"2024-06-24T08:32:30.153917Z","shell.execute_reply.started":"2024-06-24T08:32:30.147388Z","shell.execute_reply":"2024-06-24T08:32:30.152543Z"},"trusted":true},"execution_count":104,"outputs":[]},{"cell_type":"code","source":"print(f'Accuracy: {accuracy}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.156317Z","iopub.execute_input":"2024-06-24T08:32:30.158114Z","iopub.status.idle":"2024-06-24T08:32:30.166258Z","shell.execute_reply.started":"2024-06-24T08:32:30.158065Z","shell.execute_reply":"2024-06-24T08:32:30.164929Z"},"trusted":true},"execution_count":105,"outputs":[{"name":"stdout","text":"Accuracy: 0.9473684210526315\n","output_type":"stream"}]},{"cell_type":"code","source":"accuracy_dict","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.168545Z","iopub.execute_input":"2024-06-24T08:32:30.171022Z","iopub.status.idle":"2024-06-24T08:32:30.179325Z","shell.execute_reply.started":"2024-06-24T08:32:30.170973Z","shell.execute_reply":"2024-06-24T08:32:30.177905Z"},"trusted":true},"execution_count":106,"outputs":[{"execution_count":106,"output_type":"execute_result","data":{"text/plain":"{'Logistic Regression': 94.74}"},"metadata":{}}]},{"cell_type":"code","source":"# Confusion Matrix\nconf_matrix = confusion_matrix(Y_test, prediction)\nprint(f'Confusion Matrix:\\n{conf_matrix}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.181508Z","iopub.execute_input":"2024-06-24T08:32:30.182785Z","iopub.status.idle":"2024-06-24T08:32:30.193209Z","shell.execute_reply.started":"2024-06-24T08:32:30.182730Z","shell.execute_reply":"2024-06-24T08:32:30.191665Z"},"trusted":true},"execution_count":107,"outputs":[{"name":"stdout","text":"Confusion Matrix:\n[[38  4]\n [ 2 70]]\n","output_type":"stream"}]},{"cell_type":"code","source":"# Classification Report\nclass_report = 
classification_report(Y_test, prediction)\nprint(f'Classification Report:\\n{class_report}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.195311Z","iopub.execute_input":"2024-06-24T08:32:30.196812Z","iopub.status.idle":"2024-06-24T08:32:30.232652Z","shell.execute_reply.started":"2024-06-24T08:32:30.196764Z","shell.execute_reply":"2024-06-24T08:32:30.231131Z"},"trusted":true},"execution_count":108,"outputs":[{"name":"stdout","text":"Classification Report:\n              precision    recall  f1-score   support\n\n           0       0.95      0.90      0.93        42\n           1       0.95      0.97      0.96        72\n\n    accuracy                           0.95       114\n   macro avg       0.95      0.94      0.94       114\nweighted avg       0.95      0.95      0.95       114\n\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **Support Vector Machine**","metadata":{}},{"cell_type":"code","source":"from sklearn.svm import SVC","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.234861Z","iopub.execute_input":"2024-06-24T08:32:30.236254Z","iopub.status.idle":"2024-06-24T08:32:30.242121Z","shell.execute_reply.started":"2024-06-24T08:32:30.236203Z","shell.execute_reply":"2024-06-24T08:32:30.240920Z"},"trusted":true},"execution_count":109,"outputs":[]},{"cell_type":"code","source":"# Initialize the model\nmodel = SVC(kernel='linear')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.244166Z","iopub.execute_input":"2024-06-24T08:32:30.245508Z","iopub.status.idle":"2024-06-24T08:32:30.253306Z","shell.execute_reply.started":"2024-06-24T08:32:30.245460Z","shell.execute_reply":"2024-06-24T08:32:30.252015Z"},"trusted":true},"execution_count":110,"outputs":[]},{"cell_type":"code","source":"# Train the model\nmodel.fit(X_train, 
Y_train)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:30.255111Z","iopub.execute_input":"2024-06-24T08:32:30.256144Z","iopub.status.idle":"2024-06-24T08:32:31.882133Z","shell.execute_reply.started":"2024-06-24T08:32:30.256095Z","shell.execute_reply":"2024-06-24T08:32:31.880904Z"},"trusted":true},"execution_count":111,"outputs":[{"execution_count":111,"output_type":"execute_result","data":{"text/plain":"SVC(kernel='linear')","text/html":"<style>#sk-container-id-6 {color: black;background-color: white;}#sk-container-id-6 pre{padding: 0;}#sk-container-id-6 div.sk-toggleable {background-color: white;}#sk-container-id-6 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-6 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-6 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-6 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-6 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-6 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-6 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-6 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-6 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-6 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-6 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: 
hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-6 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-6 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-6 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-6 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-6 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-6 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-6 div.sk-item {position: relative;z-index: 1;}#sk-container-id-6 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-6 div.sk-item::before, #sk-container-id-6 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-6 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-6 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-6 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-6 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-6 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-6 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-6 div.sk-label-container {text-align: 
center;}#sk-container-id-6 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-6 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-6\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>SVC(kernel=&#x27;linear&#x27;)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-6\" type=\"checkbox\" checked><label for=\"sk-estimator-id-6\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">SVC</label><div class=\"sk-toggleable__content\"><pre>SVC(kernel=&#x27;linear&#x27;)</pre></div></div></div></div></div>"},"metadata":{}}]},{"cell_type":"code","source":"# Predictions\nprediction = model.predict(X_test)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:31.883960Z","iopub.execute_input":"2024-06-24T08:32:31.884311Z","iopub.status.idle":"2024-06-24T08:32:31.890641Z","shell.execute_reply.started":"2024-06-24T08:32:31.884284Z","shell.execute_reply":"2024-06-24T08:32:31.888687Z"},"trusted":true},"execution_count":112,"outputs":[]},{"cell_type":"code","source":"# Accuracy\naccuracy = accuracy_score(Y_test, prediction)\nprint(f'Accuracy: 
{accuracy}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:31.893265Z","iopub.execute_input":"2024-06-24T08:32:31.893850Z","iopub.status.idle":"2024-06-24T08:32:31.905892Z","shell.execute_reply.started":"2024-06-24T08:32:31.893805Z","shell.execute_reply":"2024-06-24T08:32:31.904212Z"},"trusted":true},"execution_count":113,"outputs":[{"name":"stdout","text":"Accuracy: 0.956140350877193\n","output_type":"stream"}]},{"cell_type":"code","source":"accuracy_dict['SVM'] = round(accuracy * 100, 2)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:31.907944Z","iopub.execute_input":"2024-06-24T08:32:31.908346Z","iopub.status.idle":"2024-06-24T08:32:31.916944Z","shell.execute_reply.started":"2024-06-24T08:32:31.908314Z","shell.execute_reply":"2024-06-24T08:32:31.915821Z"},"trusted":true},"execution_count":114,"outputs":[]},{"cell_type":"code","source":"# Confusion Matrix\nconf_matrix = confusion_matrix(Y_test, prediction)\nprint(f'Confusion Matrix:\\n{conf_matrix}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:32:31.918278Z","iopub.execute_input":"2024-06-24T08:32:31.918675Z","iopub.status.idle":"2024-06-24T08:32:31.932889Z","shell.execute_reply.started":"2024-06-24T08:32:31.918633Z","shell.execute_reply":"2024-06-24T08:32:31.931595Z"},"trusted":true},"execution_count":115,"outputs":[{"name":"stdout","text":"Confusion Matrix:\n[[38  4]\n [ 1 71]]\n","output_type":"stream"}]},{"cell_type":"code","source":"# Classification Report\nclass_report = classification_report(Y_test, prediction)\nprint(f'Classification Report:\\n{class_report}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:08.046815Z","iopub.execute_input":"2024-06-24T08:33:08.047230Z","iopub.status.idle":"2024-06-24T08:33:08.064365Z","shell.execute_reply.started":"2024-06-24T08:33:08.047198Z","shell.execute_reply":"2024-06-24T08:33:08.062874Z"},"trusted":true},"execution_count":116,"outputs":[{"name":"stdout","text":"Classification Report:\n             
 precision    recall  f1-score   support\n\n           0       0.97      0.90      0.94        42\n           1       0.95      0.99      0.97        72\n\n    accuracy                           0.96       114\n   macro avg       0.96      0.95      0.95       114\nweighted avg       0.96      0.96      0.96       114\n\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **k-Nearest Neighbors**","metadata":{}},{"cell_type":"code","source":"from sklearn.neighbors import KNeighborsClassifier","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:09.873558Z","iopub.execute_input":"2024-06-24T08:33:09.874403Z","iopub.status.idle":"2024-06-24T08:33:09.880385Z","shell.execute_reply.started":"2024-06-24T08:33:09.874363Z","shell.execute_reply":"2024-06-24T08:33:09.878342Z"},"trusted":true},"execution_count":117,"outputs":[]},{"cell_type":"code","source":"# Initialize the model\nk = 99  # Choosing k=99 for this example\nmodel = KNeighborsClassifier(n_neighbors=k)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:12.611797Z","iopub.execute_input":"2024-06-24T08:33:12.612317Z","iopub.status.idle":"2024-06-24T08:33:12.618590Z","shell.execute_reply.started":"2024-06-24T08:33:12.612276Z","shell.execute_reply":"2024-06-24T08:33:12.617325Z"},"trusted":true},"execution_count":118,"outputs":[]},{"cell_type":"code","source":"# Train the model\nmodel.fit(X_train, Y_train)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:13.089043Z","iopub.execute_input":"2024-06-24T08:33:13.089446Z","iopub.status.idle":"2024-06-24T08:33:13.099429Z","shell.execute_reply.started":"2024-06-24T08:33:13.089415Z","shell.execute_reply":"2024-06-24T08:33:13.097972Z"},"trusted":true},"execution_count":119,"outputs":[{"execution_count":119,"output_type":"execute_result","data":{"text/plain":"KNeighborsClassifier(n_neighbors=99)","text/html":"<style>#sk-container-id-7 {color: black;background-color: white;}#sk-container-id-7 pre{padding: 0;}#sk-container-id-7 
div.sk-toggleable {background-color: white;}#sk-container-id-7 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-7 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-7 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-7 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-7 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-7 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-7 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-7 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-7 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-7 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-7 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-7 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-7 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-7 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-7 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-7 div.sk-serial::before {content: \"\";position: 
absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-7 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-7 div.sk-item {position: relative;z-index: 1;}#sk-container-id-7 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-7 div.sk-item::before, #sk-container-id-7 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-7 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-7 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-7 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-7 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-7 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-7 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-7 div.sk-label-container {text-align: center;}#sk-container-id-7 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. 
See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-7 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-7\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>KNeighborsClassifier(n_neighbors=99)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-7\" type=\"checkbox\" checked><label for=\"sk-estimator-id-7\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">KNeighborsClassifier</label><div class=\"sk-toggleable__content\"><pre>KNeighborsClassifier(n_neighbors=99)</pre></div></div></div></div></div>"},"metadata":{}}]},{"cell_type":"code","source":"# Predictions\nprediction = model.predict(X_test)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:13.482205Z","iopub.execute_input":"2024-06-24T08:33:13.482625Z","iopub.status.idle":"2024-06-24T08:33:13.551838Z","shell.execute_reply.started":"2024-06-24T08:33:13.482587Z","shell.execute_reply":"2024-06-24T08:33:13.550653Z"},"trusted":true},"execution_count":120,"outputs":[]},{"cell_type":"code","source":"# Accuracy\naccuracy = accuracy_score(Y_test, prediction)\nprint(f'Accuracy: {accuracy}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:14.009733Z","iopub.execute_input":"2024-06-24T08:33:14.010151Z","iopub.status.idle":"2024-06-24T08:33:14.017984Z","shell.execute_reply.started":"2024-06-24T08:33:14.010119Z","shell.execute_reply":"2024-06-24T08:33:14.016846Z"},"trusted":true},"execution_count":121,"outputs":[{"name":"stdout","text":"Accuracy: 
0.9210526315789473\n","output_type":"stream"}]},{"cell_type":"code","source":"accuracy_dict['kNN-99'] = round(accuracy * 100, 2)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:14.475762Z","iopub.execute_input":"2024-06-24T08:33:14.476193Z","iopub.status.idle":"2024-06-24T08:33:14.481485Z","shell.execute_reply.started":"2024-06-24T08:33:14.476161Z","shell.execute_reply":"2024-06-24T08:33:14.480361Z"},"trusted":true},"execution_count":122,"outputs":[]},{"cell_type":"code","source":"# Confusion Matrix\nconf_matrix = confusion_matrix(Y_test, prediction)\nprint(f'Confusion Matrix:\\n{conf_matrix}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:14.865244Z","iopub.execute_input":"2024-06-24T08:33:14.865647Z","iopub.status.idle":"2024-06-24T08:33:14.873803Z","shell.execute_reply.started":"2024-06-24T08:33:14.865617Z","shell.execute_reply":"2024-06-24T08:33:14.872454Z"},"trusted":true},"execution_count":123,"outputs":[{"name":"stdout","text":"Confusion Matrix:\n[[35  7]\n [ 2 70]]\n","output_type":"stream"}]},{"cell_type":"code","source":"# Classification Report\nclass_report = classification_report(Y_test, prediction)\nprint(f'Classification Report:\\n{class_report}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:15.271034Z","iopub.execute_input":"2024-06-24T08:33:15.271897Z","iopub.status.idle":"2024-06-24T08:33:15.292649Z","shell.execute_reply.started":"2024-06-24T08:33:15.271860Z","shell.execute_reply":"2024-06-24T08:33:15.291165Z"},"trusted":true},"execution_count":124,"outputs":[{"name":"stdout","text":"Classification Report:\n              precision    recall  f1-score   support\n\n           0       0.95      0.83      0.89        42\n           1       0.91      0.97      0.94        72\n\n    accuracy                           0.92       114\n   macro avg       0.93      0.90      0.91       114\nweighted avg       0.92      0.92      0.92       
114\n\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **Decision Tree**","metadata":{}},{"cell_type":"code","source":"from sklearn.tree import DecisionTreeClassifier","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:16.148428Z","iopub.execute_input":"2024-06-24T08:33:16.149489Z","iopub.status.idle":"2024-06-24T08:33:16.163615Z","shell.execute_reply.started":"2024-06-24T08:33:16.149445Z","shell.execute_reply":"2024-06-24T08:33:16.161901Z"},"trusted":true},"execution_count":125,"outputs":[]},{"cell_type":"code","source":"# Initialize the model\nmodel = DecisionTreeClassifier(random_state=42)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:16.689011Z","iopub.execute_input":"2024-06-24T08:33:16.689430Z","iopub.status.idle":"2024-06-24T08:33:16.695022Z","shell.execute_reply.started":"2024-06-24T08:33:16.689402Z","shell.execute_reply":"2024-06-24T08:33:16.693604Z"},"trusted":true},"execution_count":126,"outputs":[]},{"cell_type":"code","source":"# Train the model\nmodel.fit(X_train, Y_train)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:17.129040Z","iopub.execute_input":"2024-06-24T08:33:17.129457Z","iopub.status.idle":"2024-06-24T08:33:17.148679Z","shell.execute_reply.started":"2024-06-24T08:33:17.129426Z","shell.execute_reply":"2024-06-24T08:33:17.147286Z"},"trusted":true},"execution_count":127,"outputs":[{"execution_count":127,"output_type":"execute_result","data":{"text/plain":"DecisionTreeClassifier(random_state=42)","text/html":"<style>#sk-container-id-8 {color: black;background-color: white;}#sk-container-id-8 pre{padding: 0;}#sk-container-id-8 div.sk-toggleable {background-color: white;}#sk-container-id-8 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-8 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-8 
label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-8 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-8 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-8 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-8 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-8 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-8 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-8 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-8 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-8 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-8 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-8 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-8 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-8 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-8 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-8 div.sk-item {position: relative;z-index: 1;}#sk-container-id-8 
div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-8 div.sk-item::before, #sk-container-id-8 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-8 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-8 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-8 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-8 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-8 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-8 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-8 div.sk-label-container {text-align: center;}#sk-container-id-8 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-8 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-8\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>DecisionTreeClassifier(random_state=42)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. 
<br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-8\" type=\"checkbox\" checked><label for=\"sk-estimator-id-8\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">DecisionTreeClassifier</label><div class=\"sk-toggleable__content\"><pre>DecisionTreeClassifier(random_state=42)</pre></div></div></div></div></div>"},"metadata":{}}]},{"cell_type":"code","source":"# Predictions\nprediction = model.predict(X_test)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:17.600465Z","iopub.execute_input":"2024-06-24T08:33:17.600874Z","iopub.status.idle":"2024-06-24T08:33:17.607374Z","shell.execute_reply.started":"2024-06-24T08:33:17.600846Z","shell.execute_reply":"2024-06-24T08:33:17.605501Z"},"trusted":true},"execution_count":128,"outputs":[]},{"cell_type":"code","source":"# Accuracy\naccuracy = accuracy_score(Y_test, prediction)\nprint(f'Accuracy: {accuracy}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:18.071411Z","iopub.execute_input":"2024-06-24T08:33:18.071827Z","iopub.status.idle":"2024-06-24T08:33:18.079924Z","shell.execute_reply.started":"2024-06-24T08:33:18.071799Z","shell.execute_reply":"2024-06-24T08:33:18.078179Z"},"trusted":true},"execution_count":129,"outputs":[{"name":"stdout","text":"Accuracy: 0.9122807017543859\n","output_type":"stream"}]},{"cell_type":"code","source":"accuracy_dict['DT-42'] = round(accuracy * 100, 
2)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:18.433722Z","iopub.execute_input":"2024-06-24T08:33:18.434130Z","iopub.status.idle":"2024-06-24T08:33:18.439981Z","shell.execute_reply.started":"2024-06-24T08:33:18.434099Z","shell.execute_reply":"2024-06-24T08:33:18.438055Z"},"trusted":true},"execution_count":130,"outputs":[]},{"cell_type":"code","source":"# Confusion Matrix\nconf_matrix = confusion_matrix(Y_test, prediction)\nprint(f'Confusion Matrix:\\n{conf_matrix}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:18.870802Z","iopub.execute_input":"2024-06-24T08:33:18.871247Z","iopub.status.idle":"2024-06-24T08:33:18.879073Z","shell.execute_reply.started":"2024-06-24T08:33:18.871215Z","shell.execute_reply":"2024-06-24T08:33:18.877958Z"},"trusted":true},"execution_count":131,"outputs":[{"name":"stdout","text":"Confusion Matrix:\n[[39  3]\n [ 7 65]]\n","output_type":"stream"}]},{"cell_type":"code","source":"# Classification Report\nclass_report = classification_report(Y_test, prediction)\nprint(f'Classification Report:\\n{class_report}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:19.488733Z","iopub.execute_input":"2024-06-24T08:33:19.489127Z","iopub.status.idle":"2024-06-24T08:33:19.504035Z","shell.execute_reply.started":"2024-06-24T08:33:19.489097Z","shell.execute_reply":"2024-06-24T08:33:19.502981Z"},"trusted":true},"execution_count":132,"outputs":[{"name":"stdout","text":"Classification Report:\n              precision    recall  f1-score   support\n\n           0       0.85      0.93      0.89        42\n           1       0.96      0.90      0.93        72\n\n    accuracy                           0.91       114\n   macro avg       0.90      0.92      0.91       114\nweighted avg       0.92      0.91      0.91       114\n\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **Random Forest**","metadata":{}},{"cell_type":"code","source":"from sklearn.ensemble import 
RandomForestClassifier","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:20.547002Z","iopub.execute_input":"2024-06-24T08:33:20.547409Z","iopub.status.idle":"2024-06-24T08:33:20.624951Z","shell.execute_reply.started":"2024-06-24T08:33:20.547378Z","shell.execute_reply":"2024-06-24T08:33:20.623193Z"},"trusted":true},"execution_count":133,"outputs":[]},{"cell_type":"code","source":"# Initialize the model\nmodel = RandomForestClassifier(random_state=42)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:21.459257Z","iopub.execute_input":"2024-06-24T08:33:21.459698Z","iopub.status.idle":"2024-06-24T08:33:21.465460Z","shell.execute_reply.started":"2024-06-24T08:33:21.459668Z","shell.execute_reply":"2024-06-24T08:33:21.464186Z"},"trusted":true},"execution_count":134,"outputs":[]},{"cell_type":"code","source":"# Train the model\nmodel.fit(X_train, Y_train)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:21.887675Z","iopub.execute_input":"2024-06-24T08:33:21.889290Z","iopub.status.idle":"2024-06-24T08:33:22.166937Z","shell.execute_reply.started":"2024-06-24T08:33:21.889231Z","shell.execute_reply":"2024-06-24T08:33:22.165397Z"},"trusted":true},"execution_count":135,"outputs":[{"execution_count":135,"output_type":"execute_result","data":{"text/plain":"RandomForestClassifier(random_state=42)","text/html":"<style>#sk-container-id-9 {color: black;background-color: white;}#sk-container-id-9 pre{padding: 0;}#sk-container-id-9 div.sk-toggleable {background-color: white;}#sk-container-id-9 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-9 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-9 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-9 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: 
black;}#sk-container-id-9 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-9 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-9 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-9 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-9 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-9 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-9 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-9 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-9 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-9 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-9 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-9 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-9 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-9 div.sk-item {position: relative;z-index: 1;}#sk-container-id-9 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-9 
div.sk-item::before, #sk-container-id-9 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-9 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-9 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-9 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-9 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-9 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-9 div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-9 div.sk-label-container {text-align: center;}#sk-container-id-9 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-9 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-9\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>RandomForestClassifier(random_state=42)</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. 
<br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-9\" type=\"checkbox\" checked><label for=\"sk-estimator-id-9\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">RandomForestClassifier</label><div class=\"sk-toggleable__content\"><pre>RandomForestClassifier(random_state=42)</pre></div></div></div></div></div>"},"metadata":{}}]},{"cell_type":"code","source":"# Predictions\nprediction = model.predict(X_test)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:22.361001Z","iopub.execute_input":"2024-06-24T08:33:22.361390Z","iopub.status.idle":"2024-06-24T08:33:22.379099Z","shell.execute_reply.started":"2024-06-24T08:33:22.361360Z","shell.execute_reply":"2024-06-24T08:33:22.377896Z"},"trusted":true},"execution_count":136,"outputs":[]},{"cell_type":"code","source":"# Accuracy\naccuracy = accuracy_score(Y_test, prediction)\nprint(f'Accuracy: {accuracy}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:22.570245Z","iopub.execute_input":"2024-06-24T08:33:22.570661Z","iopub.status.idle":"2024-06-24T08:33:22.577956Z","shell.execute_reply.started":"2024-06-24T08:33:22.570628Z","shell.execute_reply":"2024-06-24T08:33:22.576821Z"},"trusted":true},"execution_count":137,"outputs":[{"name":"stdout","text":"Accuracy: 0.956140350877193\n","output_type":"stream"}]},{"cell_type":"code","source":"accuracy_dict['RF'] = round(accuracy * 100, 
2)","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:22.807702Z","iopub.execute_input":"2024-06-24T08:33:22.808408Z","iopub.status.idle":"2024-06-24T08:33:22.813491Z","shell.execute_reply.started":"2024-06-24T08:33:22.808377Z","shell.execute_reply":"2024-06-24T08:33:22.812098Z"},"trusted":true},"execution_count":138,"outputs":[]},{"cell_type":"code","source":"# Confusion Matrix\nconf_matrix = confusion_matrix(Y_test, prediction)\nprint(f'Confusion Matrix:\\n{conf_matrix}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:23.013857Z","iopub.execute_input":"2024-06-24T08:33:23.014272Z","iopub.status.idle":"2024-06-24T08:33:23.022495Z","shell.execute_reply.started":"2024-06-24T08:33:23.014240Z","shell.execute_reply":"2024-06-24T08:33:23.021298Z"},"trusted":true},"execution_count":139,"outputs":[{"name":"stdout","text":"Confusion Matrix:\n[[39  3]\n [ 2 70]]\n","output_type":"stream"}]},{"cell_type":"code","source":"# Classification Report\nclass_report = classification_report(Y_test, prediction)\nprint(f'Classification Report:\\n{class_report}')","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:23.844248Z","iopub.execute_input":"2024-06-24T08:33:23.844762Z","iopub.status.idle":"2024-06-24T08:33:23.864212Z","shell.execute_reply.started":"2024-06-24T08:33:23.844725Z","shell.execute_reply":"2024-06-24T08:33:23.862313Z"},"trusted":true},"execution_count":140,"outputs":[{"name":"stdout","text":"Classification Report:\n              precision    recall  f1-score   support\n\n           0       0.95      0.93      0.94        42\n           1       0.96      0.97      0.97        72\n\n    accuracy                           0.96       114\n   macro avg       0.96      0.95      0.95       114\nweighted avg       0.96      0.96      0.96       114\n\n","output_type":"stream"}]},{"cell_type":"markdown","source":"## **Accuracy 
Comparison**","metadata":{}},{"cell_type":"code","source":"accuracy_dict","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:28.827662Z","iopub.execute_input":"2024-06-24T08:33:28.828502Z","iopub.status.idle":"2024-06-24T08:33:28.836995Z","shell.execute_reply.started":"2024-06-24T08:33:28.828446Z","shell.execute_reply":"2024-06-24T08:33:28.835658Z"},"trusted":true},"execution_count":141,"outputs":[{"execution_count":141,"output_type":"execute_result","data":{"text/plain":"{'Logistic Regression': 94.74,\n 'SVM': 95.61,\n 'kNN-99': 92.11,\n 'DT-42': 91.23,\n 'RF': 95.61}"},"metadata":{}}]},{"cell_type":"code","source":"import plotly.graph_objects as go","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:29.604210Z","iopub.execute_input":"2024-06-24T08:33:29.604670Z","iopub.status.idle":"2024-06-24T08:33:29.622791Z","shell.execute_reply.started":"2024-06-24T08:33:29.604635Z","shell.execute_reply":"2024-06-24T08:33:29.621236Z"},"trusted":true},"execution_count":142,"outputs":[]},{"cell_type":"code","source":"# Define the data\nmodels = list(accuracy_dict.keys())\naccuracy_scores = list(accuracy_dict.values())\n\n# Create a bar graph\nfig = go.Figure(data=[go.Bar(\n    x=models,\n    y=accuracy_scores,\n    text=accuracy_scores,\n    textposition='auto',\n)])\n\n# Customize layout\nfig.update_layout(\n    title='Accuracy Scores of Different Models',\n    xaxis_title='Models',\n    yaxis_title='Accuracy (%)',\n    yaxis=dict(range=[0, 100]),  # set the range of y-axis\n)\n\n# Show the plot\nfig.show()","metadata":{"execution":{"iopub.status.busy":"2024-06-24T08:33:30.560324Z","iopub.execute_input":"2024-06-24T08:33:30.560773Z","iopub.status.idle":"2024-06-24T08:33:31.112170Z","shell.execute_reply.started":"2024-06-24T08:33:30.560716Z","shell.execute_reply":"2024-06-24T08:33:31.110816Z"},"trusted":true},"execution_count":143,"outputs":[{"output_type":"display_data","data":{"text/html":"        <script type=\"text/javascript\">\n        
window.PlotlyConfig = {MathJaxConfig: 'local'};\n        if (window.MathJax && window.MathJax.Hub && window.MathJax.Hub.Config) {window.MathJax.Hub.Config({SVG: {font: \"STIX-Web\"}});}\n        if (typeof require !== 'undefined') {\n        require.undef(\"plotly\");\n        requirejs.config({\n            paths: {\n                'plotly': ['https://cdn.plot.ly/plotly-2.27.0.min']\n            }\n        });\n        require(['plotly'], function(Plotly) {\n            window._Plotly = Plotly;\n        });\n        }\n        </script>\n        "},"metadata":{}},{"output_type":"display_data","data":{"text/html":"<div>                            <div id=\"cc439224-c6fc-44ff-b70a-bc75a24d4fa5\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div>            <script type=\"text/javascript\">                require([\"plotly\"], function(Plotly) {                    window.PLOTLYENV=window.PLOTLYENV || {};                                    if (document.getElementById(\"cc439224-c6fc-44ff-b70a-bc75a24d4fa5\")) {                    Plotly.newPlot(                        \"cc439224-c6fc-44ff-b70a-bc75a24d4fa5\",                        [{\"text\":[\"94.74\",\"95.61\",\"92.11\",\"91.23\",\"95.61\"],\"textposition\":\"auto\",\"x\":[\"Logistic Regression\",\"SVM\",\"kNN-99\",\"DT-42\",\"RF\"],\"y\":[94.74,95.61,92.11,91.23,95.61],\"type\":\"bar\"}],                        
{\"template\":{\"data\":{\"histogram2dcontour\":[{\"type\":\"histogram2dcontour\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"choropleth\":[{\"type\":\"choropleth\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}],\"histogram2d\":[{\"type\":\"histogram2d\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"heatmap\":[{\"type\":\"heatmap\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"heatmapgl\":[{\"type\":\"heatmapgl\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"contourcarpet\":[{\"type\":\"contourcarpet\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}],\"contour\":[{\"type\":\"contour\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\
"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"surface\":[{\"type\":\"surface\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"},\"colorscale\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]]}],\"mesh3d\":[{\"type\":\"mesh3d\",\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}],\"scatter\":[{\"fillpattern\":{\"fillmode\":\"overlay\",\"size\":10,\"solidity\":0.2},\"type\":\"scatter\"}],\"parcoords\":[{\"type\":\"parcoords\",\"line\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"scatterpolargl\":[{\"type\":\"scatterpolargl\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"bar\":[{\"error_x\":{\"color\":\"#2a3f5f\"},\"error_y\":{\"color\":\"#2a3f5f\"},\"marker\":{\"line\":{\"color\":\"#E5ECF6\",\"width\":0.5},\"pattern\":{\"fillmode\":\"overlay\",\"size\":10,\"solidity\":0.2}},\"type\":\"bar\"}],\"scattergeo\":[{\"type\":\"scattergeo\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"scatterpolar\":[{\"type\":\"scatterpolar\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"histogram\":[{\"marker\":{\"pattern\":{\"fillmode\":\"overlay\",\"size\":10,\"solidity\":0.2}},\"type\":\"histogram\"}],\"scattergl\":[{\"type\":\"scattergl\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"scatter3d\":[{\"type\":\"scatter3d\",\"line\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}},\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"scattermapbox\":[{\"type\":\"scattermapbox\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"t
icks\":\"\"}}}],\"scatterternary\":[{\"type\":\"scatterternary\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"scattercarpet\":[{\"type\":\"scattercarpet\",\"marker\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}}}],\"carpet\":[{\"aaxis\":{\"endlinecolor\":\"#2a3f5f\",\"gridcolor\":\"white\",\"linecolor\":\"white\",\"minorgridcolor\":\"white\",\"startlinecolor\":\"#2a3f5f\"},\"baxis\":{\"endlinecolor\":\"#2a3f5f\",\"gridcolor\":\"white\",\"linecolor\":\"white\",\"minorgridcolor\":\"white\",\"startlinecolor\":\"#2a3f5f\"},\"type\":\"carpet\"}],\"table\":[{\"cells\":{\"fill\":{\"color\":\"#EBF0F8\"},\"line\":{\"color\":\"white\"}},\"header\":{\"fill\":{\"color\":\"#C8D4E3\"},\"line\":{\"color\":\"white\"}},\"type\":\"table\"}],\"barpolar\":[{\"marker\":{\"line\":{\"color\":\"#E5ECF6\",\"width\":0.5},\"pattern\":{\"fillmode\":\"overlay\",\"size\":10,\"solidity\":0.2}},\"type\":\"barpolar\"}],\"pie\":[{\"automargin\":true,\"type\":\"pie\"}]},\"layout\":{\"autotypenumbers\":\"strict\",\"colorway\":[\"#636efa\",\"#EF553B\",\"#00cc96\",\"#ab63fa\",\"#FFA15A\",\"#19d3f3\",\"#FF6692\",\"#B6E880\",\"#FF97FF\",\"#FECB52\"],\"font\":{\"color\":\"#2a3f5f\"},\"hovermode\":\"closest\",\"hoverlabel\":{\"align\":\"left\"},\"paper_bgcolor\":\"white\",\"plot_bgcolor\":\"#E5ECF6\",\"polar\":{\"bgcolor\":\"#E5ECF6\",\"angularaxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\"},\"radialaxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\"}},\"ternary\":{\"bgcolor\":\"#E5ECF6\",\"aaxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\"},\"baxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\"},\"caxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\"}},\"coloraxis\":{\"colorbar\":{\"outlinewidth\":0,\"ticks\":\"\"}},\"colorscale\":{\"sequential\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,
\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]],\"sequentialminus\":[[0.0,\"#0d0887\"],[0.1111111111111111,\"#46039f\"],[0.2222222222222222,\"#7201a8\"],[0.3333333333333333,\"#9c179e\"],[0.4444444444444444,\"#bd3786\"],[0.5555555555555556,\"#d8576b\"],[0.6666666666666666,\"#ed7953\"],[0.7777777777777778,\"#fb9f3a\"],[0.8888888888888888,\"#fdca26\"],[1.0,\"#f0f921\"]],\"diverging\":[[0,\"#8e0152\"],[0.1,\"#c51b7d\"],[0.2,\"#de77ae\"],[0.3,\"#f1b6da\"],[0.4,\"#fde0ef\"],[0.5,\"#f7f7f7\"],[0.6,\"#e6f5d0\"],[0.7,\"#b8e186\"],[0.8,\"#7fbc41\"],[0.9,\"#4d9221\"],[1,\"#276419\"]]},\"xaxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\",\"title\":{\"standoff\":15},\"zerolinecolor\":\"white\",\"automargin\":true,\"zerolinewidth\":2},\"yaxis\":{\"gridcolor\":\"white\",\"linecolor\":\"white\",\"ticks\":\"\",\"title\":{\"standoff\":15},\"zerolinecolor\":\"white\",\"automargin\":true,\"zerolinewidth\":2},\"scene\":{\"xaxis\":{\"backgroundcolor\":\"#E5ECF6\",\"gridcolor\":\"white\",\"linecolor\":\"white\",\"showbackground\":true,\"ticks\":\"\",\"zerolinecolor\":\"white\",\"gridwidth\":2},\"yaxis\":{\"backgroundcolor\":\"#E5ECF6\",\"gridcolor\":\"white\",\"linecolor\":\"white\",\"showbackground\":true,\"ticks\":\"\",\"zerolinecolor\":\"white\",\"gridwidth\":2},\"zaxis\":{\"backgroundcolor\":\"#E5ECF6\",\"gridcolor\":\"white\",\"linecolor\":\"white\",\"showbackground\":true,\"ticks\":\"\",\"zerolinecolor\":\"white\",\"gridwidth\":2}},\"shapedefaults\":{\"line\":{\"color\":\"#2a3f5f\"}},\"annotationdefaults\":{\"arrowcolor\":\"#2a3f5f\",\"arrowhead\":0,\"arrowwidth\":1},\"geo\":{\"bgcolor\":\"white\",\"landcolor\":\"#E5ECF6\",\"subunitcolor\":\"white\",\"showland\":true,\"showlakes\":true,\"lakecolor\":\"white\"},\"title\":{\"x\":0.05},\"mapbox\":{\"style\":\"light\"}}},\"yaxis\":{\"title\":{\"text\":\"Accuracy 
(%)\"},\"range\":[0,100]},\"title\":{\"text\":\"Accuracy Scores of Different Models\"},\"xaxis\":{\"title\":{\"text\":\"Models\"}}},                        {\"responsive\": true}                    ).then(function(){\n                            \nvar gd = document.getElementById('cc439224-c6fc-44ff-b70a-bc75a24d4fa5');\nvar x = new MutationObserver(function (mutations, observer) {{\n        var display = window.getComputedStyle(gd).display;\n        if (!display || display === 'none') {{\n            console.log([gd, 'removed!']);\n            Plotly.purge(gd);\n            observer.disconnect();\n        }}\n}});\n\n// Listen for the removal of the full notebook cells\nvar notebookContainer = gd.closest('#notebook-container');\nif (notebookContainer) {{\n    x.observe(notebookContainer, {childList: true});\n}}\n\n// Listen for the clearing of the current output cell\nvar outputEl = gd.closest('.output');\nif (outputEl) {{\n    x.observe(outputEl, {childList: true});\n}}\n\n                        })                };                });            </script>        </div>"},"metadata":{}}]}]}
\ No newline at end of file