{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "# The path is relative, so it resolves against the kernel's working directory.\n",
    "heart_data = pd.read_csv('../heart_data.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [],
   "source": [
    "# The raw KidneyDisease column, plus one sub-frame per label ('Yes' / 'No').\n",
    "Kidney = heart_data['KidneyDisease']\n",
    "KidneyDisease = heart_data[heart_data['KidneyDisease'] == 'Yes']\n",
    "dont_have_KidneyDisease = heart_data[heart_data['KidneyDisease'] == 'No']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "count 319795\n",
       "unique 2\n",
       "top No\n",
       "freq 308016\n",
       "Name: KidneyDisease, dtype: object"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "Kidney.describe()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "KidneyDisease.describe()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Percentage of kidney patients that don't have heart disease 70.66813821207234\n",
      "Percentage of kidney patients that have heart disease 29.331861787927668\n"
     ]
    }
   ],
   "source": [
    "# Count rows with len(): DataFrame.size is rows * columns, so a ratio of sizes\n",
    "# is only a row ratio when both frames have the same number of columns.\n",
    "kidney_total = len(KidneyDisease)\n",
    "kidney_without_hd = len(KidneyDisease[KidneyDisease[\"HeartDisease\"] == \"No\"])\n",
    "kidney_with_hd = len(KidneyDisease[KidneyDisease[\"HeartDisease\"] == \"Yes\"])\n",
    "\n",
    "print(\"Percentage of kidney patients that don't have heart disease\", 100 * kidney_without_hd / kidney_total)\n",
    "print(\"Percentage of kidney patients that have heart disease\", 100 * kidney_with_hd / kidney_total)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [ "
\n", " | BMI | \n", "PhysicalHealth | \n", "MentalHealth | \n", "SleepTime | \n", "
---|---|---|---|---|
count | \n", "308016.000000 | \n", "308016.000000 | \n", "308016.000000 | \n", "308016.000000 | \n", "
mean | \n", "28.262296 | \n", "3.150619 | \n", "3.840369 | \n", "7.095323 | \n", "
std | \n", "6.311631 | \n", "7.667615 | \n", "7.879449 | \n", "1.416586 | \n", "
min | \n", "12.020000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "
25% | \n", "23.960000 | \n", "0.000000 | \n", "0.000000 | \n", "6.000000 | \n", "
50% | \n", "27.270000 | \n", "0.000000 | \n", "0.000000 | \n", "7.000000 | \n", "
75% | \n", "31.320000 | \n", "1.000000 | \n", "3.000000 | \n", "8.000000 | \n", "
max | \n", "94.850000 | \n", "30.000000 | \n", "30.000000 | \n", "24.000000 | \n", "