{ "cells": [ { "cell_type": "markdown", "metadata": { "id": "nweeTgBaO6TC" }, "source": [ "### Data Inspection" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "QTltTIC0G5yR" }, "outputs": [], "source": [ "import pandas as pd\n", "df= pd.read_csv('/content/healthcare-dataset-stroke-data.csv')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 261 }, "id": "Hks8hmojJ5LJ", "outputId": "1b110403-b334-4572-9f06-546913b46fcb" }, "outputs": [ { "data": { "application/vnd.google.colaboratory.intrinsic+json": { "summary": "{\n \"name\": \"df\",\n \"rows\": 5110,\n \"fields\": [\n {\n \"column\": \"id\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 21161,\n \"min\": 67,\n \"max\": 72940,\n \"num_unique_values\": 5110,\n \"samples\": [\n 40041,\n 55244,\n 70992\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"gender\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"Male\",\n \"Female\",\n \"Other\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"age\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 22.61264672311352,\n \"min\": 0.08,\n \"max\": 82.0,\n \"num_unique_values\": 104,\n \"samples\": [\n 45.0,\n 24.0,\n 33.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"hypertension\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n \"samples\": [\n 1,\n 0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"heart_disease\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"ever_married\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"No\",\n \"Yes\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"work_type\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"Self-employed\",\n \"Never_worked\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Residence_type\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"Rural\",\n \"Urban\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"avg_glucose_level\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 45.28356015058203,\n \"min\": 55.12,\n \"max\": 271.74,\n \"num_unique_values\": 3979,\n \"samples\": [\n 178.29,\n 156.69\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bmi\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 7.854066729680158,\n \"min\": 10.3,\n \"max\": 97.6,\n \"num_unique_values\": 418,\n \"samples\": [\n 49.5,\n 18.5\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"smoking_status\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"never smoked\",\n \"Unknown\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"stroke\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}", "type": "dataframe", "variable_name": "df" }, "text/html": [ "\n", "
| \n", " | id | \n", "gender | \n", "age | \n", "hypertension | \n", "heart_disease | \n", "ever_married | \n", "work_type | \n", "Residence_type | \n", "avg_glucose_level | \n", "bmi | \n", "smoking_status | \n", "stroke | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "9046 | \n", "Male | \n", "67.0 | \n", "0 | \n", "1 | \n", "Yes | \n", "Private | \n", "Urban | \n", "228.69 | \n", "36.6 | \n", "formerly smoked | \n", "1 | \n", "
| 1 | \n", "51676 | \n", "Female | \n", "61.0 | \n", "0 | \n", "0 | \n", "Yes | \n", "Self-employed | \n", "Rural | \n", "202.21 | \n", "NaN | \n", "never smoked | \n", "1 | \n", "
| 2 | \n", "31112 | \n", "Male | \n", "80.0 | \n", "0 | \n", "1 | \n", "Yes | \n", "Private | \n", "Rural | \n", "105.92 | \n", "32.5 | \n", "never smoked | \n", "1 | \n", "
| 3 | \n", "60182 | \n", "Female | \n", "49.0 | \n", "0 | \n", "0 | \n", "Yes | \n", "Private | \n", "Urban | \n", "171.23 | \n", "34.4 | \n", "smokes | \n", "1 | \n", "
| 4 | \n", "1665 | \n", "Female | \n", "79.0 | \n", "1 | \n", "0 | \n", "Yes | \n", "Self-employed | \n", "Rural | \n", "174.12 | \n", "24.0 | \n", "never smoked | \n", "1 | \n", "
| \n", " | id | \n", "gender | \n", "age | \n", "hypertension | \n", "heart_disease | \n", "ever_married | \n", "work_type | \n", "Residence_type | \n", "avg_glucose_level | \n", "bmi | \n", "smoking_status | \n", "stroke | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| count | \n", "5110.000000 | \n", "5110 | \n", "5110.000000 | \n", "5110.000000 | \n", "5110.000000 | \n", "5110 | \n", "5110 | \n", "5110 | \n", "5110.000000 | \n", "4909.000000 | \n", "5110 | \n", "5110.000000 | \n", "
| unique | \n", "NaN | \n", "3 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "2 | \n", "5 | \n", "2 | \n", "NaN | \n", "NaN | \n", "4 | \n", "NaN | \n", "
| top | \n", "NaN | \n", "Female | \n", "NaN | \n", "NaN | \n", "NaN | \n", "Yes | \n", "Private | \n", "Urban | \n", "NaN | \n", "NaN | \n", "never smoked | \n", "NaN | \n", "
| freq | \n", "NaN | \n", "2994 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "3353 | \n", "2925 | \n", "2596 | \n", "NaN | \n", "NaN | \n", "1892 | \n", "NaN | \n", "
| mean | \n", "36517.829354 | \n", "NaN | \n", "43.226614 | \n", "0.097456 | \n", "0.054012 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "106.147677 | \n", "28.893237 | \n", "NaN | \n", "0.048728 | \n", "
| std | \n", "21161.721625 | \n", "NaN | \n", "22.612647 | \n", "0.296607 | \n", "0.226063 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "45.283560 | \n", "7.854067 | \n", "NaN | \n", "0.215320 | \n", "
| min | \n", "67.000000 | \n", "NaN | \n", "0.080000 | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "55.120000 | \n", "10.300000 | \n", "NaN | \n", "0.000000 | \n", "
| 25% | \n", "17741.250000 | \n", "NaN | \n", "25.000000 | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "77.245000 | \n", "23.500000 | \n", "NaN | \n", "0.000000 | \n", "
| 50% | \n", "36932.000000 | \n", "NaN | \n", "45.000000 | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "91.885000 | \n", "28.100000 | \n", "NaN | \n", "0.000000 | \n", "
| 75% | \n", "54682.000000 | \n", "NaN | \n", "61.000000 | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "114.090000 | \n", "33.100000 | \n", "NaN | \n", "0.000000 | \n", "
| max | \n", "72940.000000 | \n", "NaN | \n", "82.000000 | \n", "1.000000 | \n", "1.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "271.740000 | \n", "97.600000 | \n", "NaN | \n", "1.000000 | \n", "
| \n", " | 0 | \n", "
|---|---|
| id | \n", "0 | \n", "
| gender | \n", "0 | \n", "
| age | \n", "0 | \n", "
| hypertension | \n", "0 | \n", "
| heart_disease | \n", "0 | \n", "
| ever_married | \n", "0 | \n", "
| work_type | \n", "0 | \n", "
| Residence_type | \n", "0 | \n", "
| avg_glucose_level | \n", "0 | \n", "
| bmi | \n", "201 | \n", "
| smoking_status | \n", "0 | \n", "
| stroke | \n", "0 | \n", "
| \n", " | count | \n", "
|---|---|
| stroke | \n", "\n", " |
| 0 | \n", "3889 | \n", "
| 1 | \n", "199 | \n", "
Enter patient details and get a predicted stroke probability.
\n", "\n", " {% if error %}\n", "Predicted Stroke Probability: {{ '%.3f'|format(result.stroke_probability) }}
\n", "Predicted Label (1 = Stroke): {{ result.predicted_label }}
\n", "POST /predict with JSON:\n",
" \n",
"{\n",
" \"gender\":\"Female\",\n",
" \"age\":45,\n",
" \"hypertension\":0,\n",
" \"heart_disease\":0,\n",
" \"ever_married\":\"Yes\",\n",
" \"work_type\":\"Private\",\n",
" \"Residence_type\":\"Urban\",\n",
" \"avg_glucose_level\":95.0,\n",
" \"bmi\":28.0,\n",
" \"smoking_status\":\"never smoked\"\n",
"}\n",
" \n",
"