diff --git a/Breast_Cancer_Classification_ueing_Neural_Network.ipynb b/Breast_Cancer_Classification_ueing_Neural_Network.ipynb new file mode 100644 index 00000000..1de6685e --- /dev/null +++ b/Breast_Cancer_Classification_ueing_Neural_Network.ipynb @@ -0,0 +1,3256 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "authorship_tag": "ABX9TyNd3jP5HcwJSesVQ0jh9ClI", + "include_colab_link": true + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "view-in-github", + "colab_type": "text" + }, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Importing the Dependencies**" + ], + "metadata": { + "id": "E8zRUcqtiMOY" + } + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": { + "id": "oOiX8ojWiA5B" + }, + "outputs": [], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "import sklearn.datasets\n", + "from sklearn.model_selection import train_test_split" + ] + }, + { + "cell_type": "markdown", + "source": [ + "##**Data Collection & Processing**" + ], + "metadata": { + "id": "3qnTVfnvp7V-" + } + }, + { + "cell_type": "code", + "source": [ + "#loading the data from sklearn\n", + "breast_cancer_dataset=sklearn.datasets.load_breast_cancer()" + ], + "metadata": { + "id": "QXM_di5VqANh" + }, + "execution_count": 3, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "print(breast_cancer_dataset)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "cZftaZOLrWvU", + "outputId": "afa210cb-60c4-4f84-bfc1-52df1f082638" + }, + "execution_count": 4, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "{'data': array([[1.799e+01, 1.038e+01, 1.228e+02, ..., 2.654e-01, 4.601e-01,\n", + " 1.189e-01],\n", + " [2.057e+01, 
1.777e+01, 1.329e+02, ..., 1.860e-01, 2.750e-01,\n", + " 8.902e-02],\n", + " [1.969e+01, 2.125e+01, 1.300e+02, ..., 2.430e-01, 3.613e-01,\n", + " 8.758e-02],\n", + " ...,\n", + " [1.660e+01, 2.808e+01, 1.083e+02, ..., 1.418e-01, 2.218e-01,\n", + " 7.820e-02],\n", + " [2.060e+01, 2.933e+01, 1.401e+02, ..., 2.650e-01, 4.087e-01,\n", + " 1.240e-01],\n", + " [7.760e+00, 2.454e+01, 4.792e+01, ..., 0.000e+00, 2.871e-01,\n", + " 7.039e-02]]), 'target': array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1,\n", + " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0,\n", + " 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0,\n", + " 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0,\n", + " 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1,\n", + " 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0,\n", + " 0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1,\n", + " 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1,\n", + " 1, 0, 1, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0,\n", + " 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0,\n", + " 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 1,\n", + " 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n", + " 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1,\n", + " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1,\n", + " 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0,\n", + " 0, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0,\n", + " 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0,\n", + " 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1,\n", + " 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0,\n", + " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1,\n", + " 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 
0,\n", + " 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1,\n", + " 1, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1,\n", + " 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1,\n", + " 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", + " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1]), 'frame': None, 'target_names': array(['malignant', 'benign'], dtype='\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
mean radiusmean texturemean perimetermean areamean smoothnessmean compactnessmean concavitymean concave pointsmean symmetrymean fractal dimension...worst radiusworst textureworst perimeterworst areaworst smoothnessworst compactnessworst concavityworst concave pointsworst symmetryworst fractal dimension
017.9910.38122.801001.00.118400.277600.30010.147100.24190.07871...25.3817.33184.602019.00.16220.66560.71190.26540.46010.11890
120.5717.77132.901326.00.084740.078640.08690.070170.18120.05667...24.9923.41158.801956.00.12380.18660.24160.18600.27500.08902
219.6921.25130.001203.00.109600.159900.19740.127900.20690.05999...23.5725.53152.501709.00.14440.42450.45040.24300.36130.08758
311.4220.3877.58386.10.142500.283900.24140.105200.25970.09744...14.9126.5098.87567.70.20980.86630.68690.25750.66380.17300
420.2914.34135.101297.00.100300.132800.19800.104300.18090.05883...22.5416.67152.201575.00.13740.20500.40000.16250.23640.07678
\n", + "

5 rows × 30 columns

\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + " \n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe", + "variable_name": "df" + } + }, + "metadata": {}, + "execution_count": 6 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# adding the 'target' column to the data frame\n", + "df['label']=breast_cancer_dataset.target" + ], + "metadata": { + "id": "Vpl_HsMhsxjm" + }, + "execution_count": 7, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "# print last 5 rows from the dataframe\n", + "df.tail()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 290 + }, + "id": "7btJtVpvtZgc", + "outputId": "62c4fc60-7e9d-49b4-a55a-8c6b669e4ce9" + }, + "execution_count": 8, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " mean radius mean texture mean perimeter mean area mean smoothness \\\n", + "564 21.56 22.39 142.00 1479.0 0.11100 \n", + "565 20.13 28.25 131.20 1261.0 0.09780 \n", + "566 16.60 28.08 108.30 858.1 0.08455 \n", + "567 20.60 29.33 140.10 1265.0 0.11780 \n", + "568 7.76 24.54 47.92 181.0 0.05263 \n", + "\n", + " mean compactness mean concavity mean concave points mean symmetry \\\n", + "564 0.11590 0.24390 0.13890 0.1726 \n", + "565 0.10340 0.14400 0.09791 0.1752 \n", + "566 0.10230 0.09251 0.05302 0.1590 \n", + "567 0.27700 0.35140 0.15200 0.2397 \n", + "568 0.04362 0.00000 0.00000 0.1587 \n", + "\n", + " mean fractal dimension ... worst texture worst perimeter worst area \\\n", + "564 0.05623 ... 26.40 166.10 2027.0 \n", + "565 0.05533 ... 38.25 155.00 1731.0 \n", + "566 0.05648 ... 34.12 126.70 1124.0 \n", + "567 0.07016 ... 39.42 184.60 1821.0 \n", + "568 0.05884 ...
30.37 59.16 268.6 \n", + "\n", + " worst smoothness worst compactness worst concavity \\\n", + "564 0.14100 0.21130 0.4107 \n", + "565 0.11660 0.19220 0.3215 \n", + "566 0.11390 0.30940 0.3403 \n", + "567 0.16500 0.86810 0.9387 \n", + "568 0.08996 0.06444 0.0000 \n", + "\n", + " worst concave points worst symmetry worst fractal dimension label \n", + "564 0.2216 0.2060 0.07115 0 \n", + "565 0.1628 0.2572 0.06637 0 \n", + "566 0.1418 0.2218 0.07820 0 \n", + "567 0.2650 0.4087 0.12400 0 \n", + "568 0.0000 0.2871 0.07039 1 \n", + "\n", + "[5 rows x 31 columns]" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
mean radiusmean texturemean perimetermean areamean smoothnessmean compactnessmean concavitymean concave pointsmean symmetrymean fractal dimension...worst textureworst perimeterworst areaworst smoothnessworst compactnessworst concavityworst concave pointsworst symmetryworst fractal dimensionlabel
56421.5622.39142.001479.00.111000.115900.243900.138900.17260.05623...26.40166.102027.00.141000.211300.41070.22160.20600.071150
56520.1328.25131.201261.00.097800.103400.144000.097910.17520.05533...38.25155.001731.00.116600.192200.32150.16280.25720.066370
56616.6028.08108.30858.10.084550.102300.092510.053020.15900.05648...34.12126.701124.00.113900.309400.34030.14180.22180.078200
56720.6029.33140.101265.00.117800.277000.351400.152000.23970.07016...39.42184.601821.00.165000.868100.93870.26500.40870.124000
5687.7624.5447.92181.00.052630.043620.000000.000000.15870.05884...30.3759.16268.60.089960.064440.00000.00000.28710.070391
\n", + "

5 rows × 31 columns

\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe" + } + }, + "metadata": {}, + "execution_count": 8 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# number of rows and columns in the dataset\n", + "df.shape" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "Yd4BbsOytrNG", + "outputId": "a7cf14ba-2ff7-41fd-efbd-2038ae8aebaa" + }, + "execution_count": 9, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "(569, 31)" + ] + }, + "metadata": {}, + "execution_count": 9 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# getting some information about the data\n", + "df.info()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "r0x-Q8L9t58I", + "outputId": "3477ee64-0df8-44b5-ecab-5ef31dd3865a" + }, + "execution_count": 10, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\n", + "RangeIndex: 569 entries, 0 to 568\n", + "Data columns (total 31 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 mean radius 569 non-null float64\n", + " 1 mean texture 569 non-null float64\n", + " 2 mean perimeter 569 non-null float64\n", + " 3 mean area 569 non-null float64\n", + " 4 mean smoothness 569 non-null float64\n", + " 5 mean compactness 569 non-null float64\n", + " 6 mean concavity 569 non-null float64\n", + " 7 mean concave points 569 non-null float64\n", + " 8 mean symmetry 569 non-null float64\n", + " 9 mean fractal dimension 569 non-null float64\n", + " 10 radius error 569 non-null float64\n", + " 11 texture error 569 non-null float64\n", + " 12 perimeter error 569 non-null float64\n", + " 13 area error 569 non-null float64\n", + " 14 smoothness error 569 non-null float64\n", + " 15 compactness error 569 non-null float64\n", + " 16 concavity error 569 non-null float64\n", + " 17 concave points error 569 non-null float64\n", + " 18 
symmetry error 569 non-null float64\n", + " 19 fractal dimension error 569 non-null float64\n", + " 20 worst radius 569 non-null float64\n", + " 21 worst texture 569 non-null float64\n", + " 22 worst perimeter 569 non-null float64\n", + " 23 worst area 569 non-null float64\n", + " 24 worst smoothness 569 non-null float64\n", + " 25 worst compactness 569 non-null float64\n", + " 26 worst concavity 569 non-null float64\n", + " 27 worst concave points 569 non-null float64\n", + " 28 worst symmetry 569 non-null float64\n", + " 29 worst fractal dimension 569 non-null float64\n", + " 30 label 569 non-null int64 \n", + "dtypes: float64(30), int64(1)\n", + "memory usage: 137.9 KB\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# checking for missing values\n", + "df.isnull().sum()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 1000 + }, + "id": "y13eCoZZuN3a", + "outputId": "fb86fa4f-0763-4cb9-f2dd-13f1d907cd74" + }, + "execution_count": 11, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "mean radius 0\n", + "mean texture 0\n", + "mean perimeter 0\n", + "mean area 0\n", + "mean smoothness 0\n", + "mean compactness 0\n", + "mean concavity 0\n", + "mean concave points 0\n", + "mean symmetry 0\n", + "mean fractal dimension 0\n", + "radius error 0\n", + "texture error 0\n", + "perimeter error 0\n", + "area error 0\n", + "smoothness error 0\n", + "compactness error 0\n", + "concavity error 0\n", + "concave points error 0\n", + "symmetry error 0\n", + "fractal dimension error 0\n", + "worst radius 0\n", + "worst texture 0\n", + "worst perimeter 0\n", + "worst area 0\n", + "worst smoothness 0\n", + "worst compactness 0\n", + "worst concavity 0\n", + "worst concave points 0\n", + "worst symmetry 0\n", + "worst fractal dimension 0\n", + "label 0\n", + "dtype: int64" + ], + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
0
mean radius0
mean texture0
mean perimeter0
mean area0
mean smoothness0
mean compactness0
mean concavity0
mean concave points0
mean symmetry0
mean fractal dimension0
radius error0
texture error0
perimeter error0
area error0
smoothness error0
compactness error0
concavity error0
concave points error0
symmetry error0
fractal dimension error0
worst radius0
worst texture0
worst perimeter0
worst area0
worst smoothness0
worst compactness0
worst concavity0
worst concave points0
worst symmetry0
worst fractal dimension0
label0
\n", + "

" + ] + }, + "metadata": {}, + "execution_count": 11 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# statistical measures about the data\n", + "df.describe()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 384 + }, + "id": "d7LX7wrGuasC", + "outputId": "4674c533-1db1-4b3f-e4de-b7efd2f9ed1a" + }, + "execution_count": 12, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " mean radius mean texture mean perimeter mean area \\\n", + "count 569.000000 569.000000 569.000000 569.000000 \n", + "mean 14.127292 19.289649 91.969033 654.889104 \n", + "std 3.524049 4.301036 24.298981 351.914129 \n", + "min 6.981000 9.710000 43.790000 143.500000 \n", + "25% 11.700000 16.170000 75.170000 420.300000 \n", + "50% 13.370000 18.840000 86.240000 551.100000 \n", + "75% 15.780000 21.800000 104.100000 782.700000 \n", + "max 28.110000 39.280000 188.500000 2501.000000 \n", + "\n", + " mean smoothness mean compactness mean concavity mean concave points \\\n", + "count 569.000000 569.000000 569.000000 569.000000 \n", + "mean 0.096360 0.104341 0.088799 0.048919 \n", + "std 0.014064 0.052813 0.079720 0.038803 \n", + "min 0.052630 0.019380 0.000000 0.000000 \n", + "25% 0.086370 0.064920 0.029560 0.020310 \n", + "50% 0.095870 0.092630 0.061540 0.033500 \n", + "75% 0.105300 0.130400 0.130700 0.074000 \n", + "max 0.163400 0.345400 0.426800 0.201200 \n", + "\n", + " mean symmetry mean fractal dimension ... worst texture \\\n", + "count 569.000000 569.000000 ... 569.000000 \n", + "mean 0.181162 0.062798 ... 25.677223 \n", + "std 0.027414 0.007060 ... 6.146258 \n", + "min 0.106000 0.049960 ... 12.020000 \n", + "25% 0.161900 0.057700 ... 21.080000 \n", + "50% 0.179200 0.061540 ... 25.410000 \n", + "75% 0.195700 0.066120 ... 29.720000 \n", + "max 0.304000 0.097440 ... 
49.540000 \n", + "\n", + " worst perimeter worst area worst smoothness worst compactness \\\n", + "count 569.000000 569.000000 569.000000 569.000000 \n", + "mean 107.261213 880.583128 0.132369 0.254265 \n", + "std 33.602542 569.356993 0.022832 0.157336 \n", + "min 50.410000 185.200000 0.071170 0.027290 \n", + "25% 84.110000 515.300000 0.116600 0.147200 \n", + "50% 97.660000 686.500000 0.131300 0.211900 \n", + "75% 125.400000 1084.000000 0.146000 0.339100 \n", + "max 251.200000 4254.000000 0.222600 1.058000 \n", + "\n", + " worst concavity worst concave points worst symmetry \\\n", + "count 569.000000 569.000000 569.000000 \n", + "mean 0.272188 0.114606 0.290076 \n", + "std 0.208624 0.065732 0.061867 \n", + "min 0.000000 0.000000 0.156500 \n", + "25% 0.114500 0.064930 0.250400 \n", + "50% 0.226700 0.099930 0.282200 \n", + "75% 0.382900 0.161400 0.317900 \n", + "max 1.252000 0.291000 0.663800 \n", + "\n", + " worst fractal dimension label \n", + "count 569.000000 569.000000 \n", + "mean 0.083946 0.627417 \n", + "std 0.018061 0.483918 \n", + "min 0.055040 0.000000 \n", + "25% 0.071460 0.000000 \n", + "50% 0.080040 1.000000 \n", + "75% 0.092080 1.000000 \n", + "max 0.207500 1.000000 \n", + "\n", + "[8 rows x 31 columns]" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + "
mean radiusmean texturemean perimetermean areamean smoothnessmean compactnessmean concavitymean concave pointsmean symmetrymean fractal dimension...worst textureworst perimeterworst areaworst smoothnessworst compactnessworst concavityworst concave pointsworst symmetryworst fractal dimensionlabel
count569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000...569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000569.000000
mean14.12729219.28964991.969033654.8891040.0963600.1043410.0887990.0489190.1811620.062798...25.677223107.261213880.5831280.1323690.2542650.2721880.1146060.2900760.0839460.627417
std3.5240494.30103624.298981351.9141290.0140640.0528130.0797200.0388030.0274140.007060...6.14625833.602542569.3569930.0228320.1573360.2086240.0657320.0618670.0180610.483918
min6.9810009.71000043.790000143.5000000.0526300.0193800.0000000.0000000.1060000.049960...12.02000050.410000185.2000000.0711700.0272900.0000000.0000000.1565000.0550400.000000
25%11.70000016.17000075.170000420.3000000.0863700.0649200.0295600.0203100.1619000.057700...21.08000084.110000515.3000000.1166000.1472000.1145000.0649300.2504000.0714600.000000
50%13.37000018.84000086.240000551.1000000.0958700.0926300.0615400.0335000.1792000.061540...25.41000097.660000686.5000000.1313000.2119000.2267000.0999300.2822000.0800401.000000
75%15.78000021.800000104.100000782.7000000.1053000.1304000.1307000.0740000.1957000.066120...29.720000125.4000001084.0000000.1460000.3391000.3829000.1614000.3179000.0920801.000000
max28.11000039.280000188.5000002501.0000000.1634000.3454000.4268000.2012000.3040000.097440...49.540000251.2000004254.0000000.2226001.0580001.2520000.2910000.6638000.2075001.000000
\n", + "

8 rows × 31 columns

\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe" + } + }, + "metadata": {}, + "execution_count": 12 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# checking the distribution of the target variable\n", + "df['label'].value_counts()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 178 + }, + "id": "WsVmI1yqvH1j", + "outputId": "c59388ce-cf49-4929-a2dd-48df3ea0015b" + }, + "execution_count": 13, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "label\n", + "1 357\n", + "0 212\n", + "Name: count, dtype: int64" + ], + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
count
label
1357
0212
\n", + "

" + ] + }, + "metadata": {}, + "execution_count": 13 + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "**1-> Benign\n", + "0-> Malignant**" + ], + "metadata": { + "id": "ggvuJcH5vcXN" + } + }, + { + "cell_type": "code", + "source": [ + "df.groupby('label').mean()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 227 + }, + "id": "xtTpxOfrviaT", + "outputId": "25c2e346-a239-4b82-a750-d121bf87b12b" + }, + "execution_count": 14, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " mean radius mean texture mean perimeter mean area mean smoothness \\\n", + "label \n", + "0 17.462830 21.604906 115.365377 978.376415 0.102898 \n", + "1 12.146524 17.914762 78.075406 462.790196 0.092478 \n", + "\n", + " mean compactness mean concavity mean concave points mean symmetry \\\n", + "label \n", + "0 0.145188 0.160775 0.087990 0.192909 \n", + "1 0.080085 0.046058 0.025717 0.174186 \n", + "\n", + " mean fractal dimension ... worst radius worst texture \\\n", + "label ... \n", + "0 0.062680 ... 21.134811 29.318208 \n", + "1 0.062867 ... 13.379801 23.515070 \n", + "\n", + " worst perimeter worst area worst smoothness worst compactness \\\n", + "label \n", + "0 141.370330 1422.286321 0.144845 0.374824 \n", + "1 87.005938 558.899440 0.124959 0.182673 \n", + "\n", + " worst concavity worst concave points worst symmetry \\\n", + "label \n", + "0 0.450606 0.182237 0.323468 \n", + "1 0.166238 0.074444 0.270246 \n", + "\n", + " worst fractal dimension \n", + "label \n", + "0 0.091530 \n", + "1 0.079442 \n", + "\n", + "[2 rows x 30 columns]" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
mean radiusmean texturemean perimetermean areamean smoothnessmean compactnessmean concavitymean concave pointsmean symmetrymean fractal dimension...worst radiusworst textureworst perimeterworst areaworst smoothnessworst compactnessworst concavityworst concave pointsworst symmetryworst fractal dimension
label
017.46283021.604906115.365377978.3764150.1028980.1451880.1607750.0879900.1929090.062680...21.13481129.318208141.3703301422.2863210.1448450.3748240.4506060.1822370.3234680.091530
112.14652417.91476278.075406462.7901960.0924780.0800850.0460580.0257170.1741860.062867...13.37980123.51507087.005938558.8994400.1249590.1826730.1662380.0744440.2702460.079442
\n", + "

2 rows × 30 columns

\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe" + } + }, + "metadata": {}, + "execution_count": 14 + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Separating the features and target**" + ], + "metadata": { + "id": "_xax7xxQwaL4" + } + }, + { + "cell_type": "code", + "source": [ + "X=df.drop(columns='label',axis=1)\n", + "Y=df['label']" + ], + "metadata": { + "id": "7Za21RYlwZxK" + }, + "execution_count": 15, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "print(X)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "MyaUAQZMwso1", + "outputId": "57696704-b668-4dce-db24-4a0ebe941496" + }, + "execution_count": 16, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + " mean radius mean texture mean perimeter mean area mean smoothness \\\n", + "0 17.99 10.38 122.80 1001.0 0.11840 \n", + "1 20.57 17.77 132.90 1326.0 0.08474 \n", + "2 19.69 21.25 130.00 1203.0 0.10960 \n", + "3 11.42 20.38 77.58 386.1 0.14250 \n", + "4 20.29 14.34 135.10 1297.0 0.10030 \n", + ".. ... ... ... ... ... \n", + "564 21.56 22.39 142.00 1479.0 0.11100 \n", + "565 20.13 28.25 131.20 1261.0 0.09780 \n", + "566 16.60 28.08 108.30 858.1 0.08455 \n", + "567 20.60 29.33 140.10 1265.0 0.11780 \n", + "568 7.76 24.54 47.92 181.0 0.05263 \n", + "\n", + " mean compactness mean concavity mean concave points mean symmetry \\\n", + "0 0.27760 0.30010 0.14710 0.2419 \n", + "1 0.07864 0.08690 0.07017 0.1812 \n", + "2 0.15990 0.19740 0.12790 0.2069 \n", + "3 0.28390 0.24140 0.10520 0.2597 \n", + "4 0.13280 0.19800 0.10430 0.1809 \n", + ".. ... ... ... ... \n", + "564 0.11590 0.24390 0.13890 0.1726 \n", + "565 0.10340 0.14400 0.09791 0.1752 \n", + "566 0.10230 0.09251 0.05302 0.1590 \n", + "567 0.27700 0.35140 0.15200 0.2397 \n", + "568 0.04362 0.00000 0.00000 0.1587 \n", + "\n", + " mean fractal dimension ... worst radius worst texture \\\n", + "0 0.07871 ...
25.380 17.33 \n", + "1 0.05667 ... 24.990 23.41 \n", + "2 0.05999 ... 23.570 25.53 \n", + "3 0.09744 ... 14.910 26.50 \n", + "4 0.05883 ... 22.540 16.67 \n", + ".. ... ... ... ... \n", + "564 0.05623 ... 25.450 26.40 \n", + "565 0.05533 ... 23.690 38.25 \n", + "566 0.05648 ... 18.980 34.12 \n", + "567 0.07016 ... 25.740 39.42 \n", + "568 0.05884 ... 9.456 30.37 \n", + "\n", + " worst perimeter worst area worst smoothness worst compactness \\\n", + "0 184.60 2019.0 0.16220 0.66560 \n", + "1 158.80 1956.0 0.12380 0.18660 \n", + "2 152.50 1709.0 0.14440 0.42450 \n", + "3 98.87 567.7 0.20980 0.86630 \n", + "4 152.20 1575.0 0.13740 0.20500 \n", + ".. ... ... ... ... \n", + "564 166.10 2027.0 0.14100 0.21130 \n", + "565 155.00 1731.0 0.11660 0.19220 \n", + "566 126.70 1124.0 0.11390 0.30940 \n", + "567 184.60 1821.0 0.16500 0.86810 \n", + "568 59.16 268.6 0.08996 0.06444 \n", + "\n", + " worst concavity worst concave points worst symmetry \\\n", + "0 0.7119 0.2654 0.4601 \n", + "1 0.2416 0.1860 0.2750 \n", + "2 0.4504 0.2430 0.3613 \n", + "3 0.6869 0.2575 0.6638 \n", + "4 0.4000 0.1625 0.2364 \n", + ".. ... ... ... \n", + "564 0.4107 0.2216 0.2060 \n", + "565 0.3215 0.1628 0.2572 \n", + "566 0.3403 0.1418 0.2218 \n", + "567 0.9387 0.2650 0.4087 \n", + "568 0.0000 0.0000 0.2871 \n", + "\n", + " worst fractal dimension \n", + "0 0.11890 \n", + "1 0.08902 \n", + "2 0.08758 \n", + "3 0.17300 \n", + "4 0.07678 \n", + ".. ... 
\n", + "564 0.07115 \n", + "565 0.06637 \n", + "566 0.07820 \n", + "567 0.12400 \n", + "568 0.07039 \n", + "\n", + "[569 rows x 30 columns]\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "print(Y)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "OepIQmtdw_B7", + "outputId": "46cd8682-2c96-4ff2-8db6-e403f4cae5af" + }, + "execution_count": 17, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "0 0\n", + "1 0\n", + "2 0\n", + "3 0\n", + "4 0\n", + " ..\n", + "564 0\n", + "565 0\n", + "566 0\n", + "567 0\n", + "568 1\n", + "Name: label, Length: 569, dtype: int64\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "Splitting the data into training data & testing data" + ], + "metadata": { + "id": "NzOB9_ixxHSO" + } + }, + { + "cell_type": "code", + "source": [ + "X_train,X_test,Y_train,Y_test=train_test_split(X,Y,test_size=0.2,random_state=2)" + ], + "metadata": { + "id": "YAn9ZAbPxRqO" + }, + "execution_count": 18, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "print(X.shape,X_train.shape,X_test.shape)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "ZorMWSzdxs0Z", + "outputId": "e71acd9d-2d3c-4358-daf4-74ac3afe00dc" + }, + "execution_count": 19, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "(569, 30) (455, 30) (114, 30)\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "Standardize the data" + ], + "metadata": { + "id": "BkZZNyBGBGJd" + } + }, + { + "cell_type": "code", + "source": [ + "from sklearn.preprocessing import StandardScaler" + ], + "metadata": { + "id": "k4zq5GX8A-DO" + }, + "execution_count": 20, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "scaler=StandardScaler()\n", + "\n", + "X_train_std=scaler.fit_transform(X_train)\n", + "\n", + "X_test_std=scaler.transform(X_test)" + ], + "metadata": { + "id": "mgbv9nzqBZn9" + }, + 
"execution_count": 21, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "print(X_train_std)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "r97XLcgOB_S6", + "outputId": "4588a5e5-596c-48f5-a11b-2f6b83551673" + }, + "execution_count": 22, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[-0.01330339 1.7757658 -0.01491962 ... -0.13236958 -1.08014517\n", + " -0.03527943]\n", + " [-0.8448276 -0.6284278 -0.87702746 ... -1.11552632 -0.85773964\n", + " -0.72098905]\n", + " [ 1.44755936 0.71180168 1.47428816 ... 0.87583964 0.4967602\n", + " 0.46321706]\n", + " ...\n", + " [-0.46608541 -1.49375484 -0.53234924 ... -1.32388956 -1.02997851\n", + " -0.75145272]\n", + " [-0.50025764 -1.62161319 -0.527814 ... -0.0987626 0.35796577\n", + " -0.43906159]\n", + " [ 0.96060511 1.21181916 1.00427242 ... 0.8956983 -1.23064515\n", + " 0.50697397]]\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Building the Neural Network** \n", + "\n", + "![neural network.png]()" + ], + "metadata": { + "id": "11V_7aD3ypwk" + } + }, + { + "cell_type": "code", + "source": [ + "# importing tensorflow and keras\n", + "import tensorflow as tf\n", + "tf.random.set_seed(3)\n", + "from tensorflow import keras" + ], + "metadata": { + "id": "4gFqwyb5zk4F" + }, + "execution_count": 23, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "# setting up the layers for my neural network\n", + "model=keras.Sequential([\n", + " keras.layers.Flatten(input_shape=(30,)),\n", + " keras.layers.Dense(20,activation='relu'),\n", + " keras.layers.Dense(2,activation='sigmoid')\n", + "])" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "3CQ4PsbI2Rts", + "outputId": "8f75d7b7-fe03-4bdc-cf88-668d113097ee" + }, + "execution_count": 24, + "outputs": [ + { + "output_type": "stream", + "name": "stderr", + "text": [ + 
"/usr/local/lib/python3.10/dist-packages/keras/src/layers/reshaping/flatten.py:37: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.\n", + " super().__init__(**kwargs)\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# compiling the neural network\n", + "model.compile(optimizer='adam',\n", + " loss='sparse_categorical_crossentropy',\n", + " metrics=['accuracy'])" + ], + "metadata": { + "id": "2aecDJHe9YhD" + }, + "execution_count": 25, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "# training the neural network\n", + "\n", + "history=model.fit(X_train_std,Y_train,validation_split=0.1,epochs=10)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "SKhajeU-_WTi", + "outputId": "9dc5a6f7-1fa7-4df0-e21e-ff1b0a1f1f4c" + }, + "execution_count": 26, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Epoch 1/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m1s\u001b[0m 30ms/step - accuracy: 0.3608 - loss: 1.0537 - val_accuracy: 0.5652 - val_loss: 0.6574\n", + "Epoch 2/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 7ms/step - accuracy: 0.6294 - loss: 0.6775 - val_accuracy: 0.7609 - val_loss: 0.4467\n", + "Epoch 3/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 6ms/step - accuracy: 0.8020 - loss: 0.4507 - val_accuracy: 0.9130 - val_loss: 0.3312\n", + "Epoch 4/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 7ms/step - accuracy: 0.8936 - loss: 0.3233 - val_accuracy: 0.9348 - val_loss: 0.2647\n", + "Epoch 5/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m 
\u001b[1m0s\u001b[0m 5ms/step - accuracy: 0.9204 - loss: 0.2509 - val_accuracy: 0.9348 - val_loss: 0.2237\n", + "Epoch 6/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 7ms/step - accuracy: 0.9397 - loss: 0.2069 - val_accuracy: 0.9565 - val_loss: 0.1959\n", + "Epoch 7/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 5ms/step - accuracy: 0.9506 - loss: 0.1781 - val_accuracy: 0.9565 - val_loss: 0.1757\n", + "Epoch 8/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 5ms/step - accuracy: 0.9551 - loss: 0.1579 - val_accuracy: 0.9565 - val_loss: 0.1603\n", + "Epoch 9/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 8ms/step - accuracy: 0.9551 - loss: 0.1429 - val_accuracy: 0.9565 - val_loss: 0.1483\n", + "Epoch 10/10\n", + "\u001b[1m13/13\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 7ms/step - accuracy: 0.9551 - loss: 0.1312 - val_accuracy: 0.9565 - val_loss: 0.1385\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Visualising the accuracy and the loss**" + ], + "metadata": { + "id": "GEhDxgLtE0qF" + } + }, + { + "cell_type": "code", + "source": [ + "plt.plot(history.history['accuracy'])\n", + "plt.plot(history.history['val_accuracy'])\n", + "\n", + "plt.title('model-accuracy')\n", + "plt.ylabel('accuracy')\n", + "plt.xlabel('epoch')\n", + "\n", + "plt.legend(['training data','validation data'],loc='lower right')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 489 + }, + "id": "1l-CU0h3FMvi", + "outputId": "fb7c6f1b-de71-47f5-8876-a255526fba74" + }, + "execution_count": 27, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 27 
+ }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "plt.plot(history.history['loss'])\n", + "plt.plot(history.history['val_loss'])\n", + "\n", + "plt.title('model-loss')\n", + "plt.ylabel('loss')\n", + "plt.xlabel('epoch')\n", + "\n", + "plt.legend(['training data','validation data'],loc='upper right')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 489 + }, + "id": "M7OmXFtJKk2l", + "outputId": "6e212930-8899-4458-c372-e3266c4c0f5b" + }, + "execution_count": 28, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 28 + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Accuracy of the model on test data**" + ], + "metadata": { + "id": "-vj7sV97L2-w" + } + }, + { + "cell_type": "code", + "source": [ + "loss,accuracy=model.evaluate(X_test_std,Y_test)\n", + "print(accuracy)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "96w6x0qtL5-w", + "outputId": "7dcb237d-dd5c-49ca-d81e-718866569cd3" + }, + "execution_count": 29, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\u001b[1m4/4\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 7ms/step - accuracy: 0.9529 - loss: 0.1364 \n", + "0.9473684430122375\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "print(X_test_std.shape)\n", + "print(X_test_std[0])" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "RusDaCzqObG7", + "outputId": "1d6baa04-d162-47ad-dea1-a01d6ecc7bc2" + }, + "execution_count": 30, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "(114, 30)\n", + "[-0.04462793 -1.41612656 -0.05903514 -0.16234067 2.0202457 -0.11323672\n", + " 0.18500609 0.47102419 0.63336386 0.26335737 0.53209124 2.62763999\n", + " 0.62351167 0.11405261 1.01246781 0.41126289 0.63848593 2.88971815\n", + " -0.41675911 0.74270853 -0.32983699 -1.67435595 -0.36854552 -0.38767294\n", + " 0.32655007 -0.74858917 -0.54689089 -0.18278004 -1.23064515 -0.6268286 ]\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "Y_pred=model.predict(X_test_std)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "oEY126UrPiBQ", + "outputId": "f3f29157-3367-404f-fb29-9654a544413c" + }, + "execution_count": 31, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\u001b[1m4/4\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m 
\u001b[1m0s\u001b[0m 12ms/step\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "print(Y_pred.shape)\n", + "print(Y_pred[0])" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "RsfqQF_DPvCH", + "outputId": "e8b4ee62-95a2-4cf1-a82e-df998113d032" + }, + "execution_count": 32, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "(114, 2)\n", + "[0.14741068 0.38797656]\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "print(X_test_std)\n" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "W-liSqxSQFcH", + "outputId": "fb72782c-9575-4545-8843-380a1bead062" + }, + "execution_count": 33, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[-0.04462793 -1.41612656 -0.05903514 ... -0.18278004 -1.23064515\n", + " -0.6268286 ]\n", + " [ 0.24583601 -0.06219797 0.21802678 ... 0.54129749 0.11047691\n", + " 0.0483572 ]\n", + " [-1.26115925 -0.29051645 -1.26499659 ... -1.35138617 0.269338\n", + " -0.28231213]\n", + " ...\n", + " [ 0.72709489 0.45836817 0.75277276 ... 1.46701686 1.19909344\n", + " 0.65319961]\n", + " [ 0.25437907 1.33054477 0.15659489 ... -1.29043534 -2.22561725\n", + " -1.59557344]\n", + " [ 0.84100232 -0.06676434 0.8929529 ... 
2.15137705 0.35629355\n", + " 0.37459546]]\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "print(Y_pred)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "zG1k9lnnQZGo", + "outputId": "a2915c69-f2de-470b-b3a0-6f4029fdee0e" + }, + "execution_count": 34, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[[1.47410676e-01 3.87976557e-01]\n", + " [3.56368840e-01 5.18990397e-01]\n", + " [8.17896351e-02 8.88861656e-01]\n", + " [9.79850113e-01 1.42635719e-04]\n", + " [4.96069491e-01 6.40939593e-01]\n", + " [8.14233422e-01 6.70213718e-03]\n", + " [3.58982205e-01 7.74345934e-01]\n", + " [5.15166633e-02 8.40561211e-01]\n", + " [1.74263716e-01 8.45038652e-01]\n", + " [6.91979751e-02 7.60101020e-01]\n", + " [3.42772096e-01 4.71939981e-01]\n", + " [1.95462808e-01 7.80927837e-01]\n", + " [1.25622064e-01 6.79924786e-01]\n", + " [2.36827940e-01 6.47520542e-01]\n", + " [1.73515439e-01 8.83262813e-01]\n", + " [4.54495728e-01 1.66123912e-01]\n", + " [7.14207590e-02 8.00487936e-01]\n", + " [6.75703362e-02 8.28172982e-01]\n", + " [2.72525311e-01 8.96298707e-01]\n", + " [7.55281687e-01 2.12847684e-02]\n", + " [1.47410437e-01 9.35346961e-01]\n", + " [9.94631127e-02 7.20759630e-01]\n", + " [4.91060726e-02 8.04541647e-01]\n", + " [8.06859136e-02 8.15190315e-01]\n", + " [2.09953293e-01 7.70186722e-01]\n", + " [6.55250907e-01 5.24848960e-02]\n", + " [2.43628517e-01 6.16564453e-01]\n", + " [4.06237453e-01 5.81755459e-01]\n", + " [5.53256810e-01 2.01370031e-01]\n", + " [6.15948796e-01 4.13672999e-02]\n", + " [1.16955131e-01 6.92455769e-01]\n", + " [1.51835799e-01 8.64175141e-01]\n", + " [1.24892898e-01 7.96837449e-01]\n", + " [9.04566705e-01 5.27114794e-03]\n", + " [8.14052641e-01 6.10142201e-03]\n", + " [1.88847557e-01 5.20085216e-01]\n", + " [1.81938075e-02 7.41403461e-01]\n", + " [1.32157281e-01 5.95606744e-01]\n", + " [5.96628413e-02 8.23325336e-01]\n", + " [1.47057727e-01 8.43396306e-01]\n", + " 
[9.35085654e-01 1.44123638e-04]\n", + " [5.91420591e-01 3.30836058e-01]\n", + " [1.11651914e-02 3.28211099e-01]\n", + " [1.45664781e-01 8.49537253e-01]\n", + " [7.84874499e-01 2.68248767e-01]\n", + " [1.06081858e-01 8.27520132e-01]\n", + " [1.39571577e-01 9.38089669e-01]\n", + " [7.81977326e-02 8.93882036e-01]\n", + " [7.27857172e-01 7.77330920e-02]\n", + " [6.97005391e-01 5.91000989e-02]\n", + " [8.95728841e-02 8.02264571e-01]\n", + " [5.06602407e-01 2.13011101e-01]\n", + " [2.15893194e-01 2.28696615e-01]\n", + " [1.61636800e-01 8.08854222e-01]\n", + " [1.56091899e-01 8.99078488e-01]\n", + " [4.92944956e-01 5.16029596e-01]\n", + " [6.48338497e-02 5.45135736e-01]\n", + " [1.78481624e-01 9.69128191e-01]\n", + " [9.21820045e-01 1.14284776e-01]\n", + " [2.61452436e-01 9.00870383e-01]\n", + " [4.22357112e-01 6.79449975e-01]\n", + " [6.07607543e-01 9.39280689e-02]\n", + " [8.62012133e-02 8.36352408e-01]\n", + " [8.70399535e-01 1.47698363e-02]\n", + " [5.99702358e-01 1.65063500e-01]\n", + " [4.22271132e-01 5.33653498e-01]\n", + " [7.64765203e-01 1.51314465e-02]\n", + " [7.66184628e-01 1.50238648e-01]\n", + " [1.09157279e-01 3.24450940e-01]\n", + " [7.32976854e-01 7.75116324e-01]\n", + " [3.81087363e-01 1.50774464e-01]\n", + " [8.12568367e-01 6.42300993e-02]\n", + " [1.74612567e-01 8.76205683e-01]\n", + " [6.64195657e-01 1.78310886e-01]\n", + " [7.17609152e-02 8.92448843e-01]\n", + " [7.36038983e-01 1.04945749e-01]\n", + " [1.13246948e-01 8.52887630e-01]\n", + " [1.04686759e-01 8.94683838e-01]\n", + " [3.51051062e-01 7.63631940e-01]\n", + " [6.78609431e-01 2.62374759e-01]\n", + " [6.50655091e-01 8.00860301e-03]\n", + " [6.48401082e-01 1.13665223e-01]\n", + " [8.12505901e-01 1.40899057e-02]\n", + " [2.30170950e-01 7.72276759e-01]\n", + " [1.94433168e-01 7.50467658e-01]\n", + " [2.81481236e-01 2.52196819e-01]\n", + " [8.14478621e-02 8.66267025e-01]\n", + " [1.68887153e-01 8.68300676e-01]\n", + " [2.58163542e-01 7.41350114e-01]\n", + " [9.00962114e-01 7.07493536e-03]\n", + " 
[1.71535254e-01 8.94580781e-01]\n", + " [8.60500559e-02 4.98417109e-01]\n", + " [7.70302266e-02 8.14002991e-01]\n", + " [2.99079001e-01 1.51752317e-02]\n", + " [4.85344589e-01 1.63270041e-01]\n", + " [3.15282047e-01 7.90184855e-01]\n", + " [7.73902416e-01 9.64527391e-03]\n", + " [8.32077622e-01 2.17362903e-02]\n", + " [9.52037871e-02 5.96800566e-01]\n", + " [7.02848956e-02 8.72986794e-01]\n", + " [3.64694707e-02 8.88887167e-01]\n", + " [6.98904574e-01 1.97382331e-01]\n", + " [7.88161755e-01 9.52440128e-03]\n", + " [9.00099695e-01 1.46035792e-03]\n", + " [9.61634889e-02 6.85296476e-01]\n", + " [6.86309040e-02 9.09845293e-01]\n", + " [4.61889878e-02 8.18597913e-01]\n", + " [9.97853130e-02 9.15630996e-01]\n", + " [1.42511884e-02 9.90459144e-01]\n", + " [2.43416041e-01 5.43159842e-01]\n", + " [5.98811209e-01 1.38111971e-02]\n", + " [9.04361248e-01 2.83507463e-02]\n", + " [2.89724588e-01 4.72831637e-01]\n", + " [7.61420429e-01 6.33765683e-02]]\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "model.predict() gives the prediction probability of each class for that datapoint" + ], + "metadata": { + "id": "tAJ2sU_bQld1" + } + }, + { + "cell_type": "code", + "source": [ + "# argmax function\n", + "my_list=[0.25,0.56]\n", + "\n", + "index_of_max_value=np.argmax(my_list)\n", + "print(my_list)\n", + "print(index_of_max_value)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "Uinuyosl1bbV", + "outputId": "a20d7410-6efd-4568-f863-6934859723da" + }, + "execution_count": 38, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[0.25, 0.56]\n", + "1\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# converting the prediction probability to class labels\n", + "Y_pred_labels=[np.argmax(i) for i in Y_pred]\n", + "print(Y_pred_labels)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "9AmxrS7B3k6F", + "outputId": 
"8ff717c7-3c3d-4573-c8cb-c52346ac3c35" + }, + "execution_count": 40, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "[1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0]\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "source": [ + "## **Building the predictive system**" + ], + "metadata": { + "id": "FxbFQJt84j2K" + } + }, + { + "cell_type": "code", + "source": [ + "input_data=(11.76,21.6,74.72,427.9,0.08637,0.04966,0.01657,0.01115,0.1495,0.05888,0.4062,1.21,2.635,28.47,0.005857,0.009758,0.01168,0.007445,0.02406,0.001769,12.98,25.72,82.98,516.5,0.1085,0.08615,0.05523,0.03715,0.2433,0.06563)\n", + "\n", + "# change the input data to a numpy array\n", + "input_data_as_numpy_array=np.asarray(input_data)\n", + "\n", + "# reshape the numpy array as we are predicting for one data point\n", + "input_data_reshaped=input_data_as_numpy_array.reshape(1,-1)\n", + "\n", + "#standardizing the input data\n", + "input_data_std=scaler.transform(input_data_reshaped)\n", + "\n", + "prediction=model.predict(input_data_std)\n", + "print(prediction)\n", + "\n", + "prediction_label=[np.argmax(prediction)]\n", + "print(prediction_label)\n", + "\n", + "if(prediction_label[0]==0):\n", + " print('The tumor is Malignant')\n", + "else:\n", + " print('The tumor is Benign')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "GoOQ6rOG4gs_", + "outputId": "a83949d0-158e-4ec8-e443-c9254ee2ca34" + }, + "execution_count": 41, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\u001b[1m1/1\u001b[0m \u001b[32m━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[37m\u001b[0m \u001b[1m0s\u001b[0m 40ms/step\n", + "[[0.09100164 0.721266 
]]\n", + "[1]\n", + "The tumor is Benign\n" + ] + }, + { + "output_type": "stream", + "name": "stderr", + "text": [ + "/usr/local/lib/python3.10/dist-packages/sklearn/base.py:493: UserWarning: X does not have valid feature names, but StandardScaler was fitted with feature names\n", + " warnings.warn(\n" + ] + } + ] + } + ] +} \ No newline at end of file