{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "# Standard library\n", "import warnings\n", "from pathlib import Path\n", "\n", "# Third-party\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pandas as pd\n", "import seaborn as sns\n", "\n", "# NOTE(review): this hides every warning for the rest of the kernel session,\n", "# including pandas deprecation and dtype warnings. Consider restricting it to\n", "# the specific categories that are known to be noise.\n", "warnings.filterwarnings(\"ignore\")\n", "\n", "# Single place to change where the input CSV files are read from.\n", "# The path is relative, so it resolves against the kernel's working directory.\n", "DATA_DIR = Path(\"../transformed_data\")\n" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# 1. Wczytanie danych" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# Load X_train.csv and y_train.csv from DATA_DIR.\n", "# read_csv returns a DataFrame for each file, so y is a DataFrame, not a Series.\n", "X = pd.read_csv(DATA_DIR / \"X_train.csv\")\n", "y = pd.read_csv(DATA_DIR / \"y_train.csv\")" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Oxygen [Partial pressure] in Arterial blood | \n", "Total Bilirubin (Elevated) | \n", "Lymphocytes/100 leukocytes in Blood by Automated count | \n", "C reactive protein [Mass/volume] in Serum or Plasma | \n", "Basophils [#/volume] in Blood by Automated count | \n", "Prothrombin time (PT) | \n", "Platelet Count | \n", "Lymphocytes [#/volume] in Blood by Automated count | \n", "Carbon dioxide [Partial pressure] in Arterial blood | \n", "Eosinophils/100 leukocytes in Blood by Automated count | \n", "... | \n", "Ketones [Presence] in Urine by Test strip_2+ | \n", "Stage group.clinical Cancer_earlystage | \n", "Stage group.clinical Cancer_latestage | \n", "Smokes tobacco daily_True | \n", "SARS-CoV-2 RNA Pnl Resp NAA+probe_False | \n", "SARS-CoV-2 RNA Pnl Resp NAA+probe_True | \n", "Influenza virus A Ag [Presence] in Nasopharynx by Rapid immunoassay_False | \n", "Influenza virus A Ag [Presence] in Nasopharynx by Rapid immunoassay_True | \n", "Influenza virus B Ag [Presence] in Nasopharynx by Rapid immunoassay_False | \n", "Influenza virus B Ag [Presence] in Nasopharynx by Rapid immunoassay_True | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "48.94 | \n", "1.9 | \n", "15.19 | \n", "10.11 | \n", "0.3 | \n", "11.625 | \n", "304.1 | \n", "1.0 | \n", "40.11 | \n", "4.5 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
1 | \n", "48.94 | \n", "1.9 | \n", "15.19 | \n", "10.11 | \n", "0.3 | \n", "11.625 | \n", "304.1 | \n", "1.0 | \n", "40.11 | \n", "4.5 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
2 | \n", "48.94 | \n", "1.9 | \n", "15.19 | \n", "10.11 | \n", "0.3 | \n", "11.625 | \n", "304.1 | \n", "1.0 | \n", "40.11 | \n", "4.5 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
3 | \n", "48.94 | \n", "1.9 | \n", "15.19 | \n", "10.11 | \n", "0.3 | \n", "11.625 | \n", "304.1 | \n", "1.0 | \n", "40.11 | \n", "4.5 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
4 | \n", "48.94 | \n", "1.9 | \n", "15.19 | \n", "10.11 | \n", "0.3 | \n", "11.625 | \n", "304.1 | \n", "1.0 | \n", "40.11 | \n", "4.5 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
5 rows × 192 columns
\n", "