208 lines (207 with data), 36.0 kB
{
"cells": [
{
"attachments": {},
"cell_type": "markdown",
"metadata": {},
"source": [
"Import the needed libraries."
]
},
{
"cell_type": "code",
"execution_count": 31,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"\n",
"import matplotlib.pyplot as plt\n",
"import numpy as np\n",
"import pandas as pd\n",
"import scipy\n",
"import seaborn as sns\n",
"from scipy import stats"
]
},
{
"attachments": {},
"cell_type": "markdown",
"metadata": {},
"source": [
"Read the CSV file into a DataFrame named `df`."
]
},
{
"cell_type": "code",
"execution_count": 32,
"metadata": {},
"outputs": [],
"source": [
"# Location of the dataset. Despite its name, `url` is a local filesystem path.\n",
"# Set the HEART_DATA_CSV environment variable to point at the file on another\n",
"# machine; otherwise the original hard-coded location is used.\n",
"url = os.environ.get(\n",
"    \"HEART_DATA_CSV\",\n",
"    \"C:\\\\Users\\\\AOZ\\\\Desktop\\\\Statistics Project\\\\heart_data.csv\",\n",
")\n",
"df = pd.read_csv(url)"
]
},
{
"attachments": {},
"cell_type": "markdown",
"metadata": {},
"source": [
"Show info about the `AlcoholDrinking` column."
]
},
{
"cell_type": "code",
"execution_count": 33,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.series.Series'>\n",
"RangeIndex: 319795 entries, 0 to 319794\n",
"Series name: AlcoholDrinking\n",
"Non-Null Count Dtype \n",
"-------------- ----- \n",
"319795 non-null object\n",
"dtypes: object(1)\n",
"memory usage: 2.4+ MB\n"
]
}
],
"source": [
"# Print the column summary: number of entries, non-null count, dtype and memory usage.\n",
"df.loc[:, 'AlcoholDrinking'].info()"
]
},
{
"attachments": {},
"cell_type": "markdown",
"metadata": {},
"source": [
"Descriptive statistics of the `AlcoholDrinking` column."
]
},
{
"cell_type": "code",
"execution_count": 34,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"count 319795\n",
"unique 2\n",
"top No\n",
"freq 298018\n",
"Name: AlcoholDrinking, dtype: object"
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Series.describe ignores `include`, so the argument is omitted. For this\n",
"# object-dtype column the summary is count / unique / top / freq.\n",
"df['AlcoholDrinking'].describe()"
]
},
{
"cell_type": "code",
"execution_count": 35,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"The percent of Drinkers that get heart diseases is 5.239472838315654\n"
]
},
{
"data": {
"image/png": "",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Rows whose AlcoholDrinking value is 'Yes'.\n",
"Drinkers = df[df['AlcoholDrinking']=='Yes']\n",
"\n",
"# Distribution of the HeartDisease answers within this group.\n",
"ax = Drinkers['HeartDisease'].hist()\n",
"ax.set(title='Heart disease among drinkers', xlabel='HeartDisease', ylabel='Count')\n",
"\n",
"Drinkers_heart_disease = Drinkers[Drinkers['HeartDisease']=='Yes']\n",
"# NOTE: the double-underscore name holds the drinkers WITHOUT heart disease.\n",
"Drinkers__heart_disease = Drinkers[Drinkers['HeartDisease']=='No']\n",
"\n",
"# Compare row counts with len(): DataFrame.size is rows * columns, which only gave\n",
"# the right ratio because both frames share the same columns. An empty group yields\n",
"# NaN instead of raising ZeroDivisionError.\n",
"percent_of__Drinkers = (\n",
"    len(Drinkers_heart_disease) / len(Drinkers) * 100 if len(Drinkers) else float('nan')\n",
")\n",
"print('The percent of Drinkers that get heart diseases is ',percent_of__Drinkers)"
]
},
{
"cell_type": "code",
"execution_count": 36,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"The percent of non-Drinkers that get heart diseases is 8.802152890093886\n"
]
},
{
"data": {
"image/png": "",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Rows whose AlcoholDrinking value is 'No'.\n",
"nonDrinkers = df[df['AlcoholDrinking']=='No']\n",
"\n",
"# Distribution of the HeartDisease answers within this group.\n",
"ax = nonDrinkers['HeartDisease'].hist()\n",
"ax.set(title='Heart disease among non-drinkers', xlabel='HeartDisease', ylabel='Count')\n",
"\n",
"nonDrinkers_heart_disease = nonDrinkers[nonDrinkers['HeartDisease']=='Yes']\n",
"# NOTE: the double-underscore name holds the non-drinkers WITHOUT heart disease.\n",
"nonDrinkers__heart_disease = nonDrinkers[nonDrinkers['HeartDisease']=='No']\n",
"\n",
"# Compare row counts with len(): DataFrame.size is rows * columns, which only gave\n",
"# the right ratio because both frames share the same columns. An empty group yields\n",
"# NaN instead of raising ZeroDivisionError.\n",
"percent_of__nonDrinkers = (\n",
"    len(nonDrinkers_heart_disease) / len(nonDrinkers) * 100 if len(nonDrinkers) else float('nan')\n",
")\n",
"print('The percent of non-Drinkers that get heart diseases is ',percent_of__nonDrinkers)"
]
},
{
"attachments": {},
"cell_type": "markdown",
"metadata": {},
"source": [
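"The observed heart-disease rate is lower among drinkers (about 5.2%) than among non-drinkers (about 8.8%), so these raw percentages do not show that alcohol drinking and heart disease are unrelated. They also do not establish a causal link: a formal test of independence (e.g. a chi-square test) and control for confounders such as age are needed before drawing a conclusion."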
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.8"
},
"orig_nbformat": 4,
"vscode": {
"interpreter": {
"hash": "05c317967a6bcc6983b33dfc32d6a00017438325114854c9651b783a874b92d3"
}
}
},
"nbformat": 4,
"nbformat_minor": 2
}