{ "cells": [ { "cell_type": "code", "execution_count": 2, "id": "initial_id", "metadata": { "collapsed": true, "ExecuteTime": { "end_time": "2024-03-03T12:37:14.219767Z", "start_time": "2024-03-03T12:37:14.199729Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " id diagnosis radius_mean texture_mean perimeter_mean area_mean \\\n", "0 842302 M 17.99 10.38 122.80 1001.0 \n", "1 842517 M 20.57 17.77 132.90 1326.0 \n", "2 84300903 M 19.69 21.25 130.00 1203.0 \n", "3 84348301 M 11.42 20.38 77.58 386.1 \n", "4 84358402 M 20.29 14.34 135.10 1297.0 \n", "\n", " smoothness_mean compactness_mean concavity_mean concave points_mean \\\n", "0 0.11840 0.27760 0.3001 0.14710 \n", "1 0.08474 0.07864 0.0869 0.07017 \n", "2 0.10960 0.15990 0.1974 0.12790 \n", "3 0.14250 0.28390 0.2414 0.10520 \n", "4 0.10030 0.13280 0.1980 0.10430 \n", "\n", " ... radius_worst texture_worst perimeter_worst area_worst \\\n", "0 ... 25.38 17.33 184.60 2019.0 \n", "1 ... 24.99 23.41 158.80 1956.0 \n", "2 ... 23.57 25.53 152.50 1709.0 \n", "3 ... 14.91 26.50 98.87 567.7 \n", "4 ... 22.54 16.67 152.20 1575.0 \n", "\n", " smoothness_worst compactness_worst concavity_worst concave_points_worst \\\n", "0 0.1622 0.6656 0.7119 0.2654 \n", "1 0.1238 0.1866 0.2416 0.1860 \n", "2 0.1444 0.4245 0.4504 0.2430 \n", "3 0.2098 0.8663 0.6869 0.2575 \n", "4 0.1374 0.2050 0.4000 0.1625 \n", "\n", " symmetry_worst fractal_dimension_worst \n", "0 0.4601 0.11890 \n", "1 0.2750 0.08902 \n", "2 0.3613 0.08758 \n", "3 0.6638 0.17300 \n", "4 0.2364 0.07678 \n", "\n", "[5 rows x 32 columns]\n" ] } ], "source": [ "import pandas as pd\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.naive_bayes import GaussianNB\n", "from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score\n", "\n", "data = pd.read_csv(\"bc_data.csv\")\n", "print(data.head())" ] }, { "cell_type": "code", "outputs": [ { "data": { "text/plain": " id radius_mean texture_mean perimeter_mean area_mean \\\ncount 5.690000e+02 569.000000 569.000000 569.000000 569.000000 \nmean 3.037183e+07 14.127292 19.289649 91.969033 654.889104 \nstd 1.250206e+08 3.524049 4.301036 24.298981 351.914129 \nmin 8.670000e+03 6.981000 9.710000 43.790000 143.500000 \n25% 8.692180e+05 11.700000 16.170000 75.170000 420.300000 \n50% 9.060240e+05 13.370000 18.840000 86.240000 551.100000 \n75% 8.813129e+06 15.780000 21.800000 104.100000 782.700000 \nmax 9.113205e+08 28.110000 39.280000 188.500000 2501.000000 \n\n smoothness_mean compactness_mean concavity_mean concave points_mean \\\ncount 569.000000 569.000000 569.000000 569.000000 \nmean 0.096360 0.104341 0.088799 0.048919 \nstd 0.014064 0.052813 0.079720 0.038803 \nmin 0.052630 0.019380 0.000000 0.000000 \n25% 0.086370 0.064920 0.029560 0.020310 \n50% 0.095870 0.092630 0.061540 0.033500 \n75% 0.105300 0.130400 0.130700 0.074000 \nmax 0.163400 0.345400 0.426800 0.201200 \n\n symmetry_mean ... radius_worst texture_worst perimeter_worst \\\ncount 569.000000 ... 569.000000 569.000000 569.000000 \nmean 0.181162 ... 16.269190 25.677223 107.261213 \nstd 0.027414 ... 4.833242 6.146258 33.602542 \nmin 0.106000 ... 7.930000 12.020000 50.410000 \n25% 0.161900 ... 13.010000 21.080000 84.110000 \n50% 0.179200 ... 14.970000 25.410000 97.660000 \n75% 0.195700 ... 18.790000 29.720000 125.400000 \nmax 0.304000 ... 36.040000 49.540000 251.200000 \n\n area_worst smoothness_worst compactness_worst concavity_worst \\\ncount 569.000000 569.000000 569.000000 569.000000 \nmean 880.583128 0.132369 0.254265 0.272188 \nstd 569.356993 0.022832 0.157336 0.208624 \nmin 185.200000 0.071170 0.027290 0.000000 \n25% 515.300000 0.116600 0.147200 0.114500 \n50% 686.500000 0.131300 0.211900 0.226700 \n75% 1084.000000 0.146000 0.339100 0.382900 \nmax 4254.000000 0.222600 1.058000 1.252000 \n\n concave_points_worst symmetry_worst fractal_dimension_worst \ncount 569.000000 569.000000 569.000000 \nmean 0.114606 0.290076 0.083946 \nstd 0.065732 0.061867 0.018061 \nmin 0.000000 0.156500 0.055040 \n25% 0.064930 0.250400 0.071460 \n50% 0.099930 0.282200 0.080040 \n75% 0.161400 0.317900 0.092080 \nmax 0.291000 0.663800 0.207500 \n\n[8 rows x 31 columns]", "text/html": "
| \n | id | \nradius_mean | \ntexture_mean | \nperimeter_mean | \narea_mean | \nsmoothness_mean | \ncompactness_mean | \nconcavity_mean | \nconcave points_mean | \nsymmetry_mean | \n... | \nradius_worst | \ntexture_worst | \nperimeter_worst | \narea_worst | \nsmoothness_worst | \ncompactness_worst | \nconcavity_worst | \nconcave_points_worst | \nsymmetry_worst | \nfractal_dimension_worst | \n
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| count | \n5.690000e+02 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n... | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n569.000000 | \n
| mean | \n3.037183e+07 | \n14.127292 | \n19.289649 | \n91.969033 | \n654.889104 | \n0.096360 | \n0.104341 | \n0.088799 | \n0.048919 | \n0.181162 | \n... | \n16.269190 | \n25.677223 | \n107.261213 | \n880.583128 | \n0.132369 | \n0.254265 | \n0.272188 | \n0.114606 | \n0.290076 | \n0.083946 | \n
| std | \n1.250206e+08 | \n3.524049 | \n4.301036 | \n24.298981 | \n351.914129 | \n0.014064 | \n0.052813 | \n0.079720 | \n0.038803 | \n0.027414 | \n... | \n4.833242 | \n6.146258 | \n33.602542 | \n569.356993 | \n0.022832 | \n0.157336 | \n0.208624 | \n0.065732 | \n0.061867 | \n0.018061 | \n
| min | \n8.670000e+03 | \n6.981000 | \n9.710000 | \n43.790000 | \n143.500000 | \n0.052630 | \n0.019380 | \n0.000000 | \n0.000000 | \n0.106000 | \n... | \n7.930000 | \n12.020000 | \n50.410000 | \n185.200000 | \n0.071170 | \n0.027290 | \n0.000000 | \n0.000000 | \n0.156500 | \n0.055040 | \n
| 25% | \n8.692180e+05 | \n11.700000 | \n16.170000 | \n75.170000 | \n420.300000 | \n0.086370 | \n0.064920 | \n0.029560 | \n0.020310 | \n0.161900 | \n... | \n13.010000 | \n21.080000 | \n84.110000 | \n515.300000 | \n0.116600 | \n0.147200 | \n0.114500 | \n0.064930 | \n0.250400 | \n0.071460 | \n
| 50% | \n9.060240e+05 | \n13.370000 | \n18.840000 | \n86.240000 | \n551.100000 | \n0.095870 | \n0.092630 | \n0.061540 | \n0.033500 | \n0.179200 | \n... | \n14.970000 | \n25.410000 | \n97.660000 | \n686.500000 | \n0.131300 | \n0.211900 | \n0.226700 | \n0.099930 | \n0.282200 | \n0.080040 | \n
| 75% | \n8.813129e+06 | \n15.780000 | \n21.800000 | \n104.100000 | \n782.700000 | \n0.105300 | \n0.130400 | \n0.130700 | \n0.074000 | \n0.195700 | \n... | \n18.790000 | \n29.720000 | \n125.400000 | \n1084.000000 | \n0.146000 | \n0.339100 | \n0.382900 | \n0.161400 | \n0.317900 | \n0.092080 | \n
| max | \n9.113205e+08 | \n28.110000 | \n39.280000 | \n188.500000 | \n2501.000000 | \n0.163400 | \n0.345400 | \n0.426800 | \n0.201200 | \n0.304000 | \n... | \n36.040000 | \n49.540000 | \n251.200000 | \n4254.000000 | \n0.222600 | \n1.058000 | \n1.252000 | \n0.291000 | \n0.663800 | \n0.207500 | \n
8 rows × 31 columns
\nGaussianNB()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
GaussianNB()
GridSearchCV(cv=5, estimator=GaussianNB(),\n param_grid={'var_smoothing': [1e-07, 1e-08, 1e-09, 1e-10, 1e-11,\n 1e-12]},\n scoring='accuracy')In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. GridSearchCV(cv=5, estimator=GaussianNB(),\n param_grid={'var_smoothing': [1e-07, 1e-08, 1e-09, 1e-10, 1e-11,\n 1e-12]},\n scoring='accuracy')GaussianNB()
GaussianNB()