{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "# Third-party imports for this notebook, in alphabetical order.\n", "import numpy as np\n", "import pandas as pd\n", "import seaborn as sns" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "# Read the CSV into a DataFrame; the relative path is resolved against\n", "# the kernel's current working directory.\n", "pcos_df = pd.read_csv(\"PCOS_data.csv\")" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Sl. No | \n", "Patient File No. | \n", "PCOS (Y/N) | \n", "Age (yrs) | \n", "Weight (Kg) | \n", "Height(Cm) | \n", "BMI | \n", "Blood Group | \n", "Pulse rate(bpm) | \n", "RR (breaths/min) | \n", "... | \n", "Fast food (Y/N) | \n", "Reg.Exercise(Y/N) | \n", "BP _Systolic (mmHg) | \n", "BP _Diastolic (mmHg) | \n", "Follicle No. (L) | \n", "Follicle No. (R) | \n", "Avg. F size (L) (mm) | \n", "Avg. F size (R) (mm) | \n", "Endometrium (mm) | \n", "Column1 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "1 | \n", "1 | \n", "0 | \n", "28 | \n", "44.6 | \n", "152.0 | \n", "19.3 | \n", "15 | \n", "78 | \n", "22 | \n", "... | \n", "1.0 | \n", "0 | \n", "110 | \n", "80 | \n", "3 | \n", "3 | \n", "18.0 | \n", "18.0 | \n", "8.5 | \n", "NaN | \n", "
| 1 | \n", "2 | \n", "2 | \n", "0 | \n", "36 | \n", "65.0 | \n", "161.5 | \n", "24.9 | \n", "15 | \n", "74 | \n", "20 | \n", "... | \n", "0.0 | \n", "0 | \n", "120 | \n", "70 | \n", "3 | \n", "5 | \n", "15.0 | \n", "14.0 | \n", "3.7 | \n", "NaN | \n", "
| 2 | \n", "3 | \n", "3 | \n", "1 | \n", "33 | \n", "68.8 | \n", "165.0 | \n", "25.3 | \n", "11 | \n", "72 | \n", "18 | \n", "... | \n", "1.0 | \n", "0 | \n", "120 | \n", "80 | \n", "13 | \n", "15 | \n", "18.0 | \n", "20.0 | \n", "10.0 | \n", "NaN | \n", "
| 3 | \n", "4 | \n", "4 | \n", "0 | \n", "37 | \n", "65.0 | \n", "148.0 | \n", "29.7 | \n", "13 | \n", "72 | \n", "20 | \n", "... | \n", "0.0 | \n", "0 | \n", "120 | \n", "70 | \n", "2 | \n", "2 | \n", "15.0 | \n", "14.0 | \n", "7.5 | \n", "NaN | \n", "
| 4 | \n", "5 | \n", "5 | \n", "0 | \n", "25 | \n", "52.0 | \n", "161.0 | \n", "20.1 | \n", "11 | \n", "72 | \n", "18 | \n", "... | \n", "0.0 | \n", "0 | \n", "120 | \n", "80 | \n", "3 | \n", "4 | \n", "16.0 | \n", "14.0 | \n", "7.0 | \n", "NaN | \n", "
5 rows × 45 columns
\n", "| \n", " | Sl. No | \n", "Patient File No. | \n", "PCOS (Y/N) | \n", "Age (yrs) | \n", "Weight (Kg) | \n", "Height(Cm) | \n", "BMI | \n", "Blood Group | \n", "Pulse rate(bpm) | \n", "RR (breaths/min) | \n", "... | \n", "Pimples(Y/N) | \n", "Fast food (Y/N) | \n", "Reg.Exercise(Y/N) | \n", "BP _Systolic (mmHg) | \n", "BP _Diastolic (mmHg) | \n", "Follicle No. (L) | \n", "Follicle No. (R) | \n", "Avg. F size (L) (mm) | \n", "Avg. F size (R) (mm) | \n", "Endometrium (mm) | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| count | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "... | \n", "541.000000 | \n", "540.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "
| mean | \n", "271.000000 | \n", "271.000000 | \n", "0.327172 | \n", "31.430684 | \n", "59.637153 | \n", "156.484835 | \n", "24.307579 | \n", "13.802218 | \n", "73.247689 | \n", "19.243993 | \n", "... | \n", "0.489834 | \n", "0.514815 | \n", "0.247689 | \n", "114.661738 | \n", "76.927911 | \n", "6.129390 | \n", "6.641405 | \n", "15.018115 | \n", "15.451701 | \n", "8.475915 | \n", "
| std | \n", "156.317519 | \n", "156.317519 | \n", "0.469615 | \n", "5.411006 | \n", "11.028287 | \n", "6.033545 | \n", "4.055129 | \n", "1.840812 | \n", "4.430285 | \n", "1.688629 | \n", "... | \n", "0.500359 | \n", "0.500244 | \n", "0.432070 | \n", "7.384556 | \n", "5.574112 | \n", "4.229294 | \n", "4.436889 | \n", "3.566839 | \n", "3.318848 | \n", "2.165381 | \n", "
| min | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "20.000000 | \n", "31.000000 | \n", "137.000000 | \n", "12.400000 | \n", "11.000000 | \n", "13.000000 | \n", "16.000000 | \n", "... | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "12.000000 | \n", "8.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
| 25% | \n", "136.000000 | \n", "136.000000 | \n", "0.000000 | \n", "28.000000 | \n", "52.000000 | \n", "152.000000 | \n", "21.600000 | \n", "13.000000 | \n", "72.000000 | \n", "18.000000 | \n", "... | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "110.000000 | \n", "70.000000 | \n", "3.000000 | \n", "3.000000 | \n", "13.000000 | \n", "13.000000 | \n", "7.000000 | \n", "
| 50% | \n", "271.000000 | \n", "271.000000 | \n", "0.000000 | \n", "31.000000 | \n", "59.000000 | \n", "156.000000 | \n", "24.200000 | \n", "14.000000 | \n", "72.000000 | \n", "18.000000 | \n", "... | \n", "0.000000 | \n", "1.000000 | \n", "0.000000 | \n", "110.000000 | \n", "80.000000 | \n", "5.000000 | \n", "6.000000 | \n", "15.000000 | \n", "16.000000 | \n", "8.500000 | \n", "
| 75% | \n", "406.000000 | \n", "406.000000 | \n", "1.000000 | \n", "35.000000 | \n", "65.000000 | \n", "160.000000 | \n", "26.600000 | \n", "15.000000 | \n", "74.000000 | \n", "20.000000 | \n", "... | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "120.000000 | \n", "80.000000 | \n", "9.000000 | \n", "10.000000 | \n", "18.000000 | \n", "18.000000 | \n", "9.800000 | \n", "
| max | \n", "541.000000 | \n", "541.000000 | \n", "1.000000 | \n", "48.000000 | \n", "108.000000 | \n", "180.000000 | \n", "38.900000 | \n", "18.000000 | \n", "82.000000 | \n", "28.000000 | \n", "... | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "140.000000 | \n", "100.000000 | \n", "22.000000 | \n", "20.000000 | \n", "24.000000 | \n", "24.000000 | \n", "18.000000 | \n", "
8 rows × 42 columns
\n", "| \n", " | PCOS (Y/N) | \n", "Age (yrs) | \n", "Weight (Kg) | \n", "Height(Cm) | \n", "BMI | \n", "Blood Group | \n", "Pulse rate(bpm) | \n", "RR (breaths/min) | \n", "Hb(g/dl) | \n", "Cycle(R/I) | \n", "... | \n", "Pimples(Y/N) | \n", "Fast food (Y/N) | \n", "Reg.Exercise(Y/N) | \n", "BP _Systolic (mmHg) | \n", "BP _Diastolic (mmHg) | \n", "Follicle No. (L) | \n", "Follicle No. (R) | \n", "Avg. F size (L) (mm) | \n", "Avg. F size (R) (mm) | \n", "Endometrium (mm) | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| count | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "... | \n", "541.000000 | \n", "540.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "541.000000 | \n", "
| mean | \n", "0.327172 | \n", "31.430684 | \n", "59.637153 | \n", "156.484835 | \n", "24.307579 | \n", "13.802218 | \n", "73.247689 | \n", "19.243993 | \n", "11.160037 | \n", "0.279113 | \n", "... | \n", "0.489834 | \n", "0.514815 | \n", "0.247689 | \n", "114.661738 | \n", "76.927911 | \n", "6.129390 | \n", "6.641405 | \n", "15.018115 | \n", "15.451701 | \n", "8.475915 | \n", "
| std | \n", "0.469615 | \n", "5.411006 | \n", "11.028287 | \n", "6.033545 | \n", "4.055129 | \n", "1.840812 | \n", "4.430285 | \n", "1.688629 | \n", "0.866904 | \n", "0.448978 | \n", "... | \n", "0.500359 | \n", "0.500244 | \n", "0.432070 | \n", "7.384556 | \n", "5.574112 | \n", "4.229294 | \n", "4.436889 | \n", "3.566839 | \n", "3.318848 | \n", "2.165381 | \n", "
| min | \n", "0.000000 | \n", "20.000000 | \n", "31.000000 | \n", "137.000000 | \n", "12.400000 | \n", "11.000000 | \n", "13.000000 | \n", "16.000000 | \n", "8.500000 | \n", "0.000000 | \n", "... | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "12.000000 | \n", "8.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
| 25% | \n", "0.000000 | \n", "28.000000 | \n", "52.000000 | \n", "152.000000 | \n", "21.600000 | \n", "13.000000 | \n", "72.000000 | \n", "18.000000 | \n", "10.500000 | \n", "0.000000 | \n", "... | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "110.000000 | \n", "70.000000 | \n", "3.000000 | \n", "3.000000 | \n", "13.000000 | \n", "13.000000 | \n", "7.000000 | \n", "
| 50% | \n", "0.000000 | \n", "31.000000 | \n", "59.000000 | \n", "156.000000 | \n", "24.200000 | \n", "14.000000 | \n", "72.000000 | \n", "18.000000 | \n", "11.000000 | \n", "0.000000 | \n", "... | \n", "0.000000 | \n", "1.000000 | \n", "0.000000 | \n", "110.000000 | \n", "80.000000 | \n", "5.000000 | \n", "6.000000 | \n", "15.000000 | \n", "16.000000 | \n", "8.500000 | \n", "
| 75% | \n", "1.000000 | \n", "35.000000 | \n", "65.000000 | \n", "160.000000 | \n", "26.600000 | \n", "15.000000 | \n", "74.000000 | \n", "20.000000 | \n", "11.700000 | \n", "1.000000 | \n", "... | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "120.000000 | \n", "80.000000 | \n", "9.000000 | \n", "10.000000 | \n", "18.000000 | \n", "18.000000 | \n", "9.800000 | \n", "
| max | \n", "1.000000 | \n", "48.000000 | \n", "108.000000 | \n", "180.000000 | \n", "38.900000 | \n", "18.000000 | \n", "82.000000 | \n", "28.000000 | \n", "14.800000 | \n", "1.000000 | \n", "... | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "140.000000 | \n", "100.000000 | \n", "22.000000 | \n", "20.000000 | \n", "24.000000 | \n", "24.000000 | \n", "18.000000 | \n", "
8 rows × 42 columns
\n", "