--- a +++ b/1_simple_data.ipynb @@ -0,0 +1,33087 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "%matplotlib inline\n", + "from IPython.display import display, HTML" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Build Data Definitions" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import icu_data_defs" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>units</th>\n", + " <th>variable_type</th>\n", + " <th>clinical_source</th>\n", + " <th>list_id</th>\n", + " </tr>\n", + " <tr>\n", + " <th>def_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>heart rate</td>\n", + " <td>beats/min</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>blood pressure systolic</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>blood pressure diastolic</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>blood pressure mean</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>respiratory rate</td>\n", + " <td>insp/min</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label units variable_type clinical_source \\\n", + "def_id \n", + "0 heart rate beats/min qn observation \n", + "1 blood pressure systolic mmHg qn observation \n", + "2 blood pressure diastolic mmHg qn observation \n", + "3 blood pressure mean mmHg qn observation \n", + "4 respiratory rate insp/min qn observation \n", + "\n", + " list_id \n", + "def_id \n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN " + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_dict.tables.definitions.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "inr_id = data_dict.add_definition(label='INR')\n", + "pt_id = data_dict.add_definition(label='Prothrombin Time',units='seconds')" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>units</th>\n", + " <th>variable_type</th>\n", + " <th>clinical_source</th>\n", + " <th>list_id</th>\n", + " </tr>\n", + " <tr>\n", + " <th>def_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>23</th>\n", + " <td>lactate</td>\n", + " <td>mmol/L</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>24</th>\n", + " <td>lactate</td>\n", + " <td>mg/dL</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25</th>\n", + " <td>hemoglobin</td>\n", + " <td>g/dL</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>26</th>\n", + " <td>INR</td>\n", + " <td>NaN</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>27</th>\n", + " <td>Prothrombin Time</td>\n", + " <td>seconds</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label units variable_type clinical_source list_id\n", + "def_id \n", + "23 lactate mmol/L qn observation NaN\n", + "24 lactate mg/dL qn observation NaN\n", + "25 hemoglobin g/dL qn observation NaN\n", + "26 INR NaN qn observation NaN\n", + "27 Prothrombin Time seconds qn observation NaN" + ] + }, + "execution_count": 30, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_dict.tables.definitions.tail()" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>units</th>\n", + " <th>variable_type</th>\n", + " <th>clinical_source</th>\n", + " <th>list_id</th>\n", + " </tr>\n", + " <tr>\n", + " <th>def_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>26</th>\n", + " <td>INR</td>\n", + " <td>NaN</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>27</th>\n", + " <td>Prothrombin Time</td>\n", + " <td>seconds</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label units variable_type clinical_source list_id\n", + "def_id \n", + "26 INR NaN qn observation NaN\n", + "27 Prothrombin Time seconds qn observation NaN" + ] + }, + "execution_count": 31, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from itertools import product\n", + "\n", + "panel_map = list(product([data_dict.table_names.definitions],[inr_id,pt_id]))\n", + "panel_id = data_dict.add_panel('coagulation labs',panel_map)\n", + "data_dict.get_panel_defintions(panel_id)" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>panel_name</th>\n", + " <th>list_id</th>\n", + " </tr>\n", + " <tr>\n", + " <th>panel_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>blood pressure</td>\n", + " <td>3</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>vital signs</td>\n", + " <td>4</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>urine output</td>\n", + " <td>5</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>glasgow coma scale</td>\n", + " <td>6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>normal saline</td>\n", + " <td>7</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>lactated ringers</td>\n", + " <td>8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>common fluids</td>\n", + " <td>9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>norepinephrine</td>\n", + " <td>10</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>vasopressin</td>\n", + " <td>11</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>common pressors</td>\n", + " <td>12</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>lactate</td>\n", + " <td>13</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>oxygen delivery labs</td>\n", + " <td>14</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>simple dataset</td>\n", + " <td>15</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>coagulation labs</td>\n", + " <td>16</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " panel_name list_id\n", + "panel_id \n", + "0 blood pressure 3\n", + "1 vital signs 4\n", + "2 urine output 5\n", + "3 glasgow coma scale 6\n", + "4 normal saline 7\n", + "5 lactated ringers 8\n", + "6 common fluids 9\n", + "7 norepinephrine 10\n", + "8 vasopressin 11\n", + "9 common pressors 12\n", + "10 lactate 13\n", + "11 oxygen delivery labs 14\n", + "12 simple dataset 15\n", + "13 coagulation labs 16" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_dict.tables.panels" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>units</th>\n", + " <th>variable_type</th>\n", + " <th>clinical_source</th>\n", + " <th>list_id</th>\n", + " </tr>\n", + " <tr>\n", + " <th>def_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>heart rate</td>\n", + " <td>beats/min</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>blood pressure systolic</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>blood pressure diastolic</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>blood pressure mean</td>\n", + " <td>mmHg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>respiratory rate</td>\n", + " <td>insp/min</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>temperature body</td>\n", + " <td>degF</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>oxygen saturation pulse oximetry</td>\n", + " <td>percent</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>weight body</td>\n", + " <td>kg</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>output urine</td>\n", + " <td>mL</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>output urine</td>\n", + " <td>mL/hr</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>output urine</td>\n", + " <td>mL/kg/hr</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>glasgow coma scale motor</td>\n", + " <td>NaN</td>\n", + " <td>ord</td>\n", + " <td>observation</td>\n", + " <td>0.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>glasgow coma scale eye opening</td>\n", + " <td>NaN</td>\n", + " <td>ord</td>\n", + " <td>observation</td>\n", + " <td>2.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>glasgow coma scale verbal</td>\n", + " <td>NaN</td>\n", + " <td>ord</td>\n", + " <td>observation</td>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>14</th>\n", + " <td>normal saline</td>\n", + " <td>mL</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>15</th>\n", + " <td>normal saline</td>\n", + " <td>mL/hr</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>16</th>\n", + " <td>lactated ringers</td>\n", + " <td>mL</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>17</th>\n", + " <td>lactated ringers</td>\n", + " <td>mL/hr</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>18</th>\n", + " <td>norepinephrine</td>\n", + " <td>mcg</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>19</th>\n", + " <td>norepinephrine</td>\n", + " <td>mcg/min</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>20</th>\n", + " <td>norepinephrine</td>\n", + " <td>mcg/kg/min</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>21</th>\n", + " <td>vasopressin</td>\n", + " <td>units</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>22</th>\n", + " <td>vasopressin</td>\n", + " <td>units/min</td>\n", + " <td>qn</td>\n", + " <td>intervention</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25</th>\n", + " <td>hemoglobin</td>\n", + " <td>g/dL</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>23</th>\n", + " <td>lactate</td>\n", + " <td>mmol/L</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>24</th>\n", + " <td>lactate</td>\n", + " <td>mg/dL</td>\n", + " <td>qn</td>\n", + " <td>observation</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label units variable_type \\\n", + "def_id \n", + "0 heart rate beats/min qn \n", + "1 blood pressure systolic mmHg qn \n", + "2 blood pressure diastolic mmHg qn \n", + "3 blood pressure mean mmHg qn \n", + "4 respiratory rate insp/min qn \n", + "5 temperature body degF qn \n", + "6 oxygen saturation pulse oximetry percent qn \n", + "7 weight body kg qn \n", + "8 output urine mL qn \n", + "9 output urine mL/hr qn \n", + "10 output urine mL/kg/hr qn \n", + "11 glasgow coma scale motor NaN ord \n", + "12 glasgow coma scale eye opening NaN ord \n", + "13 glasgow coma scale verbal NaN ord \n", + "14 normal saline mL qn \n", + "15 normal saline mL/hr qn \n", + "16 lactated ringers mL qn \n", + "17 lactated ringers mL/hr qn \n", + "18 norepinephrine mcg qn \n", + "19 norepinephrine mcg/min qn \n", + "20 norepinephrine mcg/kg/min qn \n", + "21 vasopressin units qn \n", + "22 vasopressin units/min qn \n", + "25 hemoglobin g/dL qn \n", + "23 lactate mmol/L qn \n", + "24 lactate mg/dL qn \n", + "\n", + " clinical_source list_id \n", + "def_id \n", + "0 observation NaN \n", + "1 observation NaN \n", + "2 observation NaN \n", + "3 observation NaN \n", + "4 observation NaN \n", + "5 observation NaN \n", + "6 observation NaN \n", + "7 observation NaN \n", + "8 observation NaN \n", + "9 observation NaN \n", + "10 observation NaN \n", + "11 observation 0.0 \n", + "12 observation 2.0 \n", + "13 observation 1.0 \n", + "14 intervention NaN \n", + "15 intervention NaN \n", + "16 intervention NaN \n", + "17 intervention NaN \n", + "18 intervention NaN \n", + "19 intervention NaN \n", + "20 intervention NaN \n", + "21 intervention NaN \n", + "22 intervention NaN \n", + "25 observation NaN \n", + "23 observation NaN \n", + "24 observation NaN " + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_dict.get_panel_defintions(12)" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "data_dict.save()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# MIMIC Exploration" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import mimic\n", + "from icu_data_defs import data_dictionary" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "reload(mimic)\n", + "conn = mimic.connect()\n", + "data_dict = data_dictionary('config/data_definitions.xlsx')\n", + "explorer = mimic.explorer(conn)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "keep_dict = {}" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Vital Signs" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Heart Rate" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>227018</th>\n", + " <td>HR_ApacheIV</td>\n", + " <td>HR_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223765</th>\n", + " <td>Orthostatic HR sitting</td>\n", + " <td>Orthostatic HR sitting</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1332</th>\n", + " <td>pulse</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227581</th>\n", + " <td>BiPap bpm (S/T -Back up)</td>\n", + " <td>BiPap bpm (S/T -Back up)</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220047</th>\n", + " <td>Heart Rate Alarm - Low</td>\n", + " <td>HR Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224363</th>\n", + " <td>VAD Beat Rate L</td>\n", + " <td>VAD Beat Rate L</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226764</th>\n", + " <td>HrApacheIIValue</td>\n", + " <td>HrApacheIIValue</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1341</th>\n", + " <td>PULSE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220045</th>\n", + " <td>Heart Rate</td>\n", + " <td>HR</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223775</th>\n", + " <td>VAD Beat Rate R</td>\n", + " <td>VAD Beat Rate R</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220046</th>\n", + " <td>Heart rate Alarm - High</td>\n", + " <td>HR Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224751</th>\n", + " <td>Temporary Pacemaker Rate</td>\n", + " <td>Temp Pacemaker Rate</td>\n", + " <td>chartevents</td>\n", + " <td>Cardiovascular (Pacer Data)</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223764</th>\n", + " <td>Orthostatic HR lying</td>\n", + " <td>Orthostatic HR lying</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1725</th>\n", + " <td>Pulse</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224422</th>\n", + " <td>Spont RR</td>\n", + " <td>Spont RR</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224647</th>\n", + " <td>Orthostatic HR standing</td>\n", + " <td>Orthostatic HR standing</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>bpm</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>211</th>\n", + " <td>Heart Rate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220181</th>\n", + " <td>Non Invasive Blood Pressure mean</td>\n", + " <td>NBPm</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220052</th>\n", + " <td>Arterial Blood Pressure mean</td>\n", + " <td>ABPm</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3494</th>\n", + " <td>Lowest Heart Rate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>92.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "227018 HR_ApacheIV HR_ApacheIV \n", + "223765 Orthostatic HR sitting Orthostatic HR sitting \n", + "1332 pulse \n", + "227581 BiPap bpm (S/T -Back up) BiPap bpm (S/T -Back up) \n", + "220047 Heart Rate Alarm - Low HR Alarm - Low \n", + "224363 VAD Beat Rate L VAD Beat Rate L \n", + "226764 HrApacheIIValue HrApacheIIValue \n", + "1341 PULSE \n", + "220045 Heart Rate HR \n", + "223775 VAD Beat Rate R VAD Beat Rate R \n", + "220046 Heart rate Alarm - High HR Alarm - High \n", + "224751 Temporary Pacemaker Rate Temp Pacemaker Rate \n", + "223764 Orthostatic HR lying Orthostatic HR lying \n", + "1725 Pulse \n", + "224422 Spont RR Spont RR \n", + "224647 Orthostatic HR standing Orthostatic HR standing \n", + "211 Heart Rate \n", + "220181 Non Invasive Blood Pressure mean NBPm \n", + "220052 Arterial Blood Pressure mean ABPm \n", + "3494 Lowest Heart Rate \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "227018 chartevents Scores - APACHE IV (2) bpm 110.000000 \n", + "223765 chartevents Routine Vital Signs bpm 110.000000 \n", + "1332 chartevents 110.000000 \n", + "227581 chartevents Respiratory bpm 110.000000 \n", + "220047 chartevents Alarms bpm 110.000000 \n", + "224363 chartevents Hemodynamics bpm 110.000000 \n", + "226764 chartevents Scores - APACHE II bpm 110.000000 \n", + "1341 chartevents 110.000000 \n", + "220045 chartevents Routine Vital Signs bpm 110.000000 \n", + "223775 chartevents Hemodynamics bpm 110.000000 \n", + "220046 chartevents Alarms bpm 110.000000 \n", + "224751 chartevents Cardiovascular (Pacer Data) bpm 110.000000 \n", + "223764 chartevents Routine Vital Signs bpm 110.000000 \n", + "1725 chartevents 110.000000 \n", + "224422 chartevents Respiratory bpm 110.000000 \n", + "224647 chartevents Routine Vital Signs bpm 110.000000 \n", + "211 chartevents 110.000000 \n", + "220181 chartevents Routine Vital Signs mmHg 100.666667 \n", + "220052 chartevents Routine Vital Signs mmHg 100.666667 \n", + "3494 chartevents 92.666667 " + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'heart rate',\n", + " 'beats',\n", + " 'bpm',\n", + " 'pulse'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "label = data_dict.labels.HEART_RATE\n", + "keep_dict[label] = [211,220045,1341,1725,1332]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Respiratory Rate" + ] + }, + { + "cell_type": "code", + "execution_count": 66, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>3603</th>\n", + " <td>Resp Rate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224688</th>\n", + " <td>Respiratory Rate (Set)</td>\n", + " <td>Respiratory Rate (Set)</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226774</th>\n", + " <td>RRApacheIIValue</td>\n", + " <td>RRApacheIIValue</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>618</th>\n", + " <td>Respiratory Rate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224690</th>\n", + " <td>Respiratory Rate (Total)</td>\n", + " <td>Respiratory Rate (Total)</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223875</th>\n", + " <td>Fspn High</td>\n", + " <td>Fspn High</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224689</th>\n", + " <td>Respiratory Rate (spontaneous)</td>\n", + " <td>Respiratory Rate (spontaneous)</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220210</th>\n", + " <td>Respiratory Rate</td>\n", + " <td>RR</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224161</th>\n", + " <td>Resp Alarm - High</td>\n", + " <td>Resp Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227050</th>\n", + " <td>RR_ApacheIV</td>\n", + " <td>RR_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224162</th>\n", + " <td>Resp Alarm - Low</td>\n", + " <td>Resp Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>insp/min</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>619</th>\n", + " <td>Respiratory Rate Set</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>102.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225949</th>\n", + " <td>NIV Mask</td>\n", + " <td>NIV Mask</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223840</th>\n", + " <td>ETT Re-taped</td>\n", + " <td>ETT Re-taped</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223838</th>\n", + " <td>ETT Location</td>\n", + " <td>ETT Location</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223837</th>\n", + " <td>ETT Size (ID)</td>\n", + " <td>ETT Size (ID)</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224373</th>\n", + " <td>Sputum Amount</td>\n", + " <td>Sputum Amount</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223836</th>\n", + " <td>Airway Type</td>\n", + " <td>Airway Type</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226815</th>\n", + " <td>Airway problems</td>\n", + " <td>Airway problems</td>\n", + " <td></td>\n", + " <td>Respiratory</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223835</th>\n", + " <td>Inspired O2 Fraction</td>\n", + " <td>FiO2</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>None</td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "3603 Resp Rate \n", + "224688 Respiratory Rate (Set) Respiratory Rate (Set) \n", + "226774 RRApacheIIValue RRApacheIIValue \n", + "618 Respiratory Rate \n", + "224690 Respiratory Rate (Total) Respiratory Rate (Total) \n", + "223875 Fspn High Fspn High \n", + "224689 Respiratory Rate (spontaneous) Respiratory Rate (spontaneous) \n", + "220210 Respiratory Rate RR \n", + "224161 Resp Alarm - High Resp Alarm - High \n", + "227050 RR_ApacheIV RR_ApacheIV \n", + "224162 Resp Alarm - Low Resp Alarm - Low \n", + "619 Respiratory Rate Set \n", + "225949 NIV Mask NIV Mask \n", + "223840 ETT Re-taped ETT Re-taped \n", + "223838 ETT Location ETT Location \n", + "223837 ETT Size (ID) ETT Size (ID) \n", + "224373 Sputum Amount Sputum Amount \n", + "223836 Airway Type Airway Type \n", + "226815 Airway problems Airway problems \n", + "223835 Inspired O2 Fraction FiO2 \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "3603 chartevents 110.000000 \n", + "224688 chartevents Respiratory insp/min 110.000000 \n", + "226774 chartevents Scores - APACHE II insp/min 110.000000 \n", + "618 chartevents 110.000000 \n", + "224690 chartevents Respiratory insp/min 110.000000 \n", + "223875 chartevents Respiratory insp/min 110.000000 \n", + "224689 chartevents Respiratory insp/min 110.000000 \n", + "220210 chartevents Respiratory insp/min 110.000000 \n", + "224161 chartevents Alarms insp/min 110.000000 \n", + "227050 chartevents Scores - APACHE IV (2) insp/min 110.000000 \n", + "224162 chartevents Alarms insp/min 110.000000 \n", + "619 chartevents 102.666667 \n", + "225949 Respiratory 97.333333 \n", + "223840 Respiratory 97.333333 \n", + "223838 Respiratory 97.333333 \n", + "223837 Respiratory 97.333333 \n", + "224373 Respiratory 97.333333 \n", + "223836 Respiratory 97.333333 \n", + "226815 Respiratory 97.333333 \n", + "223835 chartevents Respiratory None 97.333333 " + ] + }, + "execution_count": 66, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'respiratory rate',\n", + " 'resp rate',\n", + " 'insp/min',\n", + " 'breath/min'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 67, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "label = data_dict.labels.RESPIRATORY_RATE\n", + "keep_dict[label] = [220210,3603,618,8113,615,219]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Blood Pressure" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>224315</th>\n", + " <td>ABI Brachial BP L</td>\n", + " <td>ABI Brachial BP L</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227537</th>\n", + " <td>ART Blood Pressure Alarm - High</td>\n", + " <td>ART BP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220181</th>\n", + " <td>Non Invasive Blood Pressure mean</td>\n", + " <td>NBPm</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220180</th>\n", + " <td>Non Invasive Blood Pressure diastolic</td>\n", + " <td>NBPd</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220179</th>\n", + " <td>Non Invasive Blood Pressure systolic</td>\n", + " <td>NBPs</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220074</th>\n", + " <td>Central Venous Pressure</td>\n", + " <td>CVP</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220073</th>\n", + " <td>Central Venous Pressure Alarm - Low</td>\n", + " <td>CVP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220072</th>\n", + " <td>Central Venous Pressure Alarm - High</td>\n", + " <td>CVP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220069</th>\n", + " <td>Left Artrial Pressure</td>\n", + " <td>LAP</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220066</th>\n", + " <td>Pulmonary Artery Pressure Alarm - Low</td>\n", + " <td>PAP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220063</th>\n", + " <td>Pulmonary Artery Pressure Alarm - High</td>\n", + " <td>PAP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220061</th>\n", + " <td>Pulmonary Artery Pressure mean</td>\n", + " <td>PAPm</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220060</th>\n", + " <td>Pulmonary Artery Pressure diastolic</td>\n", + " <td>PAPd</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220059</th>\n", + " <td>Pulmonary Artery Pressure systolic</td>\n", + " <td>PAPs</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220058</th>\n", + " <td>Arterial Blood Pressure Alarm - High</td>\n", + " <td>ABP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227538</th>\n", + " <td>ART Blood Pressure Alarm - Low</td>\n", + " <td>ART BP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226096</th>\n", + " <td>Orthostatic BPd standing</td>\n", + " <td>Orthostatic BPd standing</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224152</th>\n", + " <td>Return Pressure</td>\n", + " <td>Return Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Dialysis</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227066</th>\n", + " <td>Cerebral Perfusion Pressure</td>\n", + " <td>CPP</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226062</th>\n", + " <td>Venous CO2 Pressure</td>\n", + " <td>PCO2 (Venous)</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "224315 ABI Brachial BP L ABI Brachial BP L \n", + "227537 ART Blood Pressure Alarm - High ART BP Alarm - High \n", + "220181 Non Invasive Blood Pressure mean NBPm \n", + "220180 Non Invasive Blood Pressure diastolic NBPd \n", + "220179 Non Invasive Blood Pressure systolic NBPs \n", + "220074 Central Venous Pressure CVP \n", + "220073 Central Venous Pressure Alarm - Low CVP Alarm - Low \n", + "220072 Central Venous Pressure Alarm - High CVP Alarm - High \n", + "220069 Left Artrial Pressure LAP \n", + "220066 Pulmonary Artery Pressure Alarm - Low PAP Alarm - Low \n", + "220063 Pulmonary Artery Pressure Alarm - High PAP Alarm - High \n", + "220061 Pulmonary Artery Pressure mean PAPm \n", + "220060 Pulmonary Artery Pressure diastolic PAPd \n", + "220059 Pulmonary Artery Pressure systolic PAPs \n", + "220058 Arterial Blood Pressure Alarm - High ABP Alarm - High \n", + "227538 ART Blood Pressure Alarm - Low ART BP Alarm - Low \n", + "226096 Orthostatic BPd standing Orthostatic BPd standing \n", + "224152 Return Pressure Return Pressure \n", + "227066 Cerebral Perfusion Pressure CPP \n", + "226062 Venous CO2 Pressure PCO2 (Venous) \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "224315 chartevents IABP mmHg 110.0 \n", + "227537 chartevents Alarms mmHg 110.0 \n", + "220181 chartevents Routine Vital Signs mmHg 110.0 \n", + "220180 chartevents Routine Vital Signs mmHg 110.0 \n", + "220179 chartevents Routine Vital Signs mmHg 110.0 \n", + "220074 chartevents Hemodynamics mmHg 110.0 \n", + "220073 chartevents Alarms mmHg 110.0 \n", + "220072 chartevents Alarms mmHg 110.0 \n", + "220069 chartevents Hemodynamics mmHg 110.0 \n", + "220066 chartevents Alarms mmHg 110.0 \n", + "220063 chartevents Alarms mmHg 110.0 \n", + "220061 chartevents Hemodynamics mmHg 110.0 \n", + "220060 chartevents Hemodynamics mmHg 110.0 \n", + "220059 chartevents Hemodynamics mmHg 110.0 \n", + "220058 chartevents Alarms mmHg 110.0 \n", + "227538 chartevents Alarms mmHg 110.0 \n", + "226096 chartevents Routine Vital Signs mmHg 110.0 \n", + "224152 chartevents Dialysis mmHg 110.0 \n", + "227066 chartevents Hemodynamics mmHg 110.0 \n", + "226062 chartevents Labs mmHg 110.0 " + ] + }, + "execution_count": 68, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'blood pressure',\n", + " 'systolic',\n", + " 'diastolic',\n", + " 'mmHg'\n", + " ])\n", + "out_df.iloc[0:20]" + ] + }, + { + "cell_type": "code", + "execution_count": 69, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>226063</th>\n", + " <td>Venous O2 Pressure</td>\n", + " <td>PO2 (Venous)</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225312</th>\n", + " <td>ART BP mean</td>\n", + " <td>ART BP mean</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225310</th>\n", + " <td>ART BP Diastolic</td>\n", + " <td>ART BP Diastolic</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225309</th>\n", + " <td>ART BP Systolic</td>\n", + " <td>ART BP Systolic</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223751</th>\n", + " <td>Non-Invasive Blood Pressure Alarm - High</td>\n", + " <td>NBP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227516</th>\n", + " <td>PO2 (Mixed Venous)</td>\n", + " <td>PO2 (Mixed Venous)</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224166</th>\n", + " <td>Doppler BP</td>\n", + " <td>Doppler BP</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224167</th>\n", + " <td>Manual Blood Pressure Systolic Left</td>\n", + " <td>Manual BPs L</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226737</th>\n", + " <td>AaDO2ApacheIIValue</td>\n", + " <td>AaDO2ApacheIIValue</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228148</th>\n", + " <td>ABI Ankle BP R (Impella)</td>\n", + " <td>ABI Ankle BP R (Impella)</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220224</th>\n", + " <td>Arterial O2 pressure</td>\n", + " <td>PO2 (Arterial)</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220235</th>\n", + " <td>Arterial CO2 Pressure</td>\n", + " <td>PCO2 (Arterial)</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223752</th>\n", + " <td>Non-Invasive Blood Pressure Alarm - Low</td>\n", + " <td>NBP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223763</th>\n", + " <td>Bladder Pressure</td>\n", + " <td>Bladder Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224150</th>\n", + " <td>Filter Pressure</td>\n", + " <td>Filter Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Dialysis</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224149</th>\n", + " <td>Access Pressure</td>\n", + " <td>Access Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Dialysis</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227991</th>\n", + " <td>Intra Cranial Pressure #2 Alarm - Low</td>\n", + " <td>IC2 Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226094</th>\n", + " <td>Orthostatic BPd sitting</td>\n", + " <td>Orthostatic BPd sitting</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226092</th>\n", + " <td>Orthostatic BPd lying</td>\n", + " <td>Orthostatic BPd lying</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227990</th>\n", + " <td>Intra Cranial Pressure #2 Alarm - High</td>\n", + " <td>IC2 Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "226063 Venous O2 Pressure PO2 (Venous) \n", + "225312 ART BP mean ART BP mean \n", + "225310 ART BP Diastolic ART BP Diastolic \n", + "225309 ART BP Systolic ART BP Systolic \n", + "223751 Non-Invasive Blood Pressure Alarm - High NBP Alarm - High \n", + "227516 PO2 (Mixed Venous) PO2 (Mixed Venous) \n", + "224166 Doppler BP Doppler BP \n", + "224167 Manual Blood Pressure Systolic Left Manual BPs L \n", + "226737 AaDO2ApacheIIValue AaDO2ApacheIIValue \n", + "228148 ABI Ankle BP R (Impella) ABI Ankle BP R (Impella) \n", + "220224 Arterial O2 pressure PO2 (Arterial) \n", + "220235 Arterial CO2 Pressure PCO2 (Arterial) \n", + "223752 Non-Invasive Blood Pressure Alarm - Low NBP Alarm - Low \n", + "223763 Bladder Pressure Bladder Pressure \n", + "224150 Filter Pressure Filter Pressure \n", + "224149 Access Pressure Access Pressure \n", + "227991 Intra Cranial Pressure #2 Alarm - Low IC2 Alarm - Low \n", + "226094 Orthostatic BPd sitting Orthostatic BPd sitting \n", + "226092 Orthostatic BPd lying Orthostatic BPd lying \n", + "227990 Intra Cranial Pressure #2 Alarm - High IC2 Alarm - High \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "226063 chartevents Labs mmHg 110.0 \n", + "225312 chartevents Routine Vital Signs mmHg 110.0 \n", + "225310 chartevents Routine Vital Signs mmHg 110.0 \n", + "225309 chartevents Routine Vital Signs mmHg 110.0 \n", + "223751 chartevents Alarms mmHg 110.0 \n", + "227516 chartevents Labs mmHg 110.0 \n", + "224166 chartevents Routine Vital Signs mmHg 110.0 \n", + "224167 chartevents Routine Vital Signs mmHg 110.0 \n", + "226737 chartevents Scores - APACHE II mmHg 110.0 \n", + "228148 chartevents Impella mmHg 110.0 \n", + "220224 chartevents Labs mmHg 110.0 \n", + "220235 chartevents Labs mmHg 110.0 \n", + "223752 chartevents Alarms mmHg 110.0 \n", + "223763 chartevents Routine Vital Signs mmHg 110.0 \n", + "224150 chartevents Dialysis mmHg 110.0 \n", + "224149 chartevents Dialysis mmHg 110.0 \n", + "227991 chartevents Alarms mmHg 110.0 \n", + "226094 chartevents Routine Vital Signs mmHg 110.0 \n", + "226092 chartevents Routine Vital Signs mmHg 110.0 \n", + "227990 chartevents Alarms mmHg 110.0 " + ] + }, + "execution_count": 69, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] = [220179]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] = [220180]\n", + "out_df.iloc[20:40]" + ] + }, + { + "cell_type": "code", + "execution_count": 70, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>227989</th>\n", + " <td>Intra Cranial Pressure #2</td>\n", + " <td>IC2</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220056</th>\n", + " <td>Arterial Blood Pressure Alarm - Low</td>\n", + " <td>ABP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220052</th>\n", + " <td>Arterial Blood Pressure mean</td>\n", + " <td>ABPm</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220051</th>\n", + " <td>Arterial Blood Pressure diastolic</td>\n", + " <td>ABPd</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220050</th>\n", + " <td>Arterial Blood Pressure systolic</td>\n", + " <td>ABPs</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228145</th>\n", + " <td>ABI Ankle BP L</td>\n", + " <td>ABI Ankle BP L</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228146</th>\n", + " <td>ABI Brachial BP R</td>\n", + " <td>ABI Brachial BP R</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227039</th>\n", + " <td>PO2_ApacheIV</td>\n", + " <td>PO2_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220765</th>\n", + " <td>Intra Cranial Pressure</td>\n", + " <td>ICP</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227023</th>\n", + " <td>MAP_ApacheIV</td>\n", + " <td>MAP_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224309</th>\n", + " <td>Assisted Systole</td>\n", + " <td>SYS - Assisted</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224310</th>\n", + " <td>Augmented Diastole</td>\n", + " <td>AUG</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224311</th>\n", + " <td>BAEDP</td>\n", + " <td>DIA - Assisted</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224314</th>\n", + " <td>ABI Brachial BP R (Impella)</td>\n", + " <td>ABI Brachial BP R (Impella)</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224317</th>\n", + " <td>ABI Ankle BP R</td>\n", + " <td>ABI Ankle BP R</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224318</th>\n", + " <td>ABI Ankle BP L (Impella)</td>\n", + " <td>ABI Ankle BP L (Impella)</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224322</th>\n", + " <td>IABP Mean</td>\n", + " <td>MAP - Assisted</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223771</th>\n", + " <td>PCWP</td>\n", + " <td>PCWP</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223768</th>\n", + " <td>Intra Cranial Pressure Alarm - Low</td>\n", + " <td>ICP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223767</th>\n", + " <td>Intra Cranial Pressure Alarm - High</td>\n", + " <td>ICP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "227989 Intra Cranial Pressure #2 IC2 \n", + "220056 Arterial Blood Pressure Alarm - Low ABP Alarm - Low \n", + "220052 Arterial Blood Pressure mean ABPm \n", + "220051 Arterial Blood Pressure diastolic ABPd \n", + "220050 Arterial Blood Pressure systolic ABPs \n", + "228145 ABI Ankle BP L ABI Ankle BP L \n", + "228146 ABI Brachial BP R ABI Brachial BP R \n", + "227039 PO2_ApacheIV PO2_ApacheIV \n", + "220765 Intra Cranial Pressure ICP \n", + "227023 MAP_ApacheIV MAP_ApacheIV \n", + "224309 Assisted Systole SYS - Assisted \n", + "224310 Augmented Diastole AUG \n", + "224311 BAEDP DIA - Assisted \n", + "224314 ABI Brachial BP R (Impella) ABI Brachial BP R (Impella) \n", + "224317 ABI Ankle BP R ABI Ankle BP R \n", + "224318 ABI Ankle BP L (Impella) ABI Ankle BP L (Impella) \n", + "224322 IABP Mean MAP - Assisted \n", + "223771 PCWP PCWP \n", + "223768 Intra Cranial Pressure Alarm - Low ICP Alarm - Low \n", + "223767 Intra Cranial Pressure Alarm - High ICP Alarm - High \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "227989 chartevents Hemodynamics mmHg 110.0 \n", + "220056 chartevents Alarms mmHg 110.0 \n", + "220052 chartevents Routine Vital Signs mmHg 110.0 \n", + "220051 chartevents Routine Vital Signs mmHg 110.0 \n", + "220050 chartevents Routine Vital Signs mmHg 110.0 \n", + "228145 chartevents IABP mmHg 110.0 \n", + "228146 chartevents IABP mmHg 110.0 \n", + "227039 chartevents Scores - APACHE IV (2) mmHg 110.0 \n", + "220765 chartevents Hemodynamics mmHg 110.0 \n", + "227023 chartevents Scores - APACHE IV (2) mmHg 110.0 \n", + "224309 chartevents IABP mmHg 110.0 \n", + "224310 chartevents IABP mmHg 110.0 \n", + "224311 chartevents IABP mmHg 110.0 \n", + "224314 chartevents Impella mmHg 110.0 \n", + "224317 chartevents IABP mmHg 110.0 \n", + "224318 chartevents Impella mmHg 110.0 \n", + "224322 chartevents IABP mmHg 110.0 \n", + "223771 chartevents Hemodynamics mmHg 110.0 \n", + "223768 chartevents Alarms mmHg 110.0 \n", + "223767 chartevents Alarms mmHg 110.0 " + ] + }, + "execution_count": 70, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [225309,224167]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [225310,224643]\n", + "out_df.iloc[40:60]" + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>223766</th>\n", + " <td>Orthostatic BPs standing</td>\n", + " <td>Orthostatic BPs standing</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228149</th>\n", + " <td>ABI Brachial BP L (Impella)</td>\n", + " <td>ABI Brachial BP L (Impella)</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224151</th>\n", + " <td>Effluent Pressure</td>\n", + " <td>Effluent Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Dialysis</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224643</th>\n", + " <td>Manual Blood Pressure Diastolic Left</td>\n", + " <td>Manual BPd L</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224654</th>\n", + " <td>PAEDP</td>\n", + " <td>DIA - Unassisted</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226855</th>\n", + " <td>PCWP (mean) (PA Line)</td>\n", + " <td>PCWP (mean) (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226857</th>\n", + " <td>PA mean pressure (PA Line)</td>\n", + " <td>PA mean pressure (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224646</th>\n", + " <td>Orthostatic BPs sitting</td>\n", + " <td>Orthostatic BPs sitting</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227716</th>\n", + " <td>Cerebral Perfusion Pressure Alarm - High</td>\n", + " <td>CPP Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227717</th>\n", + " <td>Cerebral Perfusion Pressure Alarm - Low</td>\n", + " <td>CPP Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224645</th>\n", + " <td>Orthostatic BPs lying</td>\n", + " <td>Orthostatic BPs lying</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227242</th>\n", + " <td>Manual Blood Pressure Diastolic Right</td>\n", + " <td>Manual BPd R</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226766</th>\n", + " <td>MapApacheIIValue</td>\n", + " <td>MapApacheIIValue</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227243</th>\n", + " <td>Manual Blood Pressure Systolic Right</td>\n", + " <td>Manual BPs R</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226853</th>\n", + " <td>PA diastolic pressure(PA Line)</td>\n", + " <td>PA diastolic pressure(PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226849</th>\n", + " <td>RA (mean) pressure (PA Line)</td>\n", + " <td>RA (mean) pressure (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226850</th>\n", + " <td>RV systolic pressure(PA Line)</td>\n", + " <td>RV systolic pressure(PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226851</th>\n", + " <td>RV diastolic pressure(PA Line)</td>\n", + " <td>RV diastolic pressure(PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224659</th>\n", + " <td>Vacuum Assist</td>\n", + " <td>Vacuum Assist</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226854</th>\n", + " <td>PCWP (v wave) (PA Line)</td>\n", + " <td>PCWP (v wave) (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label \\\n", + "itemid \n", + "223766 Orthostatic BPs standing \n", + "228149 ABI Brachial BP L (Impella) \n", + "224151 Effluent Pressure \n", + "224643 Manual Blood Pressure Diastolic Left \n", + "224654 PAEDP \n", + "226855 PCWP (mean) (PA Line) \n", + "226857 PA mean pressure (PA Line) \n", + "224646 Orthostatic BPs sitting \n", + "227716 Cerebral Perfusion Pressure Alarm - High \n", + "227717 Cerebral Perfusion Pressure Alarm - Low \n", + "224645 Orthostatic BPs lying \n", + "227242 Manual Blood Pressure Diastolic Right \n", + "226766 MapApacheIIValue \n", + "227243 Manual Blood Pressure Systolic Right \n", + "226853 PA diastolic pressure(PA Line) \n", + "226849 RA (mean) pressure (PA Line) \n", + "226850 RV systolic pressure(PA Line) \n", + "226851 RV diastolic pressure(PA Line) \n", + "224659 Vacuum Assist \n", + "226854 PCWP (v wave) (PA Line) \n", + "\n", + " abbreviation linksto category \\\n", + "itemid \n", + "223766 Orthostatic BPs standing chartevents Routine Vital Signs \n", + "228149 ABI Brachial BP L (Impella) chartevents Impella \n", + "224151 Effluent Pressure chartevents Dialysis \n", + "224643 Manual BPd L chartevents Routine Vital Signs \n", + "224654 DIA - Unassisted chartevents IABP \n", + "226855 PCWP (mean) (PA Line) chartevents PA Line Insertion \n", + "226857 PA mean pressure (PA Line) chartevents PA Line Insertion \n", + "224646 Orthostatic BPs sitting chartevents Routine Vital Signs \n", + "227716 CPP Alarm - High chartevents Alarms \n", + "227717 CPP Alarm - Low chartevents Alarms \n", + "224645 Orthostatic BPs lying chartevents Routine Vital Signs \n", + "227242 Manual BPd R chartevents Routine Vital Signs \n", + "226766 MapApacheIIValue chartevents Scores - APACHE II \n", + "227243 Manual BPs R chartevents Routine Vital Signs \n", + "226853 PA diastolic pressure(PA Line) chartevents PA Line Insertion \n", + "226849 RA (mean) pressure (PA Line) chartevents PA Line Insertion \n", + "226850 RV systolic pressure(PA Line) chartevents PA Line Insertion \n", + "226851 RV diastolic pressure(PA Line) chartevents PA Line Insertion \n", + "224659 Vacuum Assist chartevents Hemodynamics \n", + "226854 PCWP (v wave) (PA Line) chartevents PA Line Insertion \n", + "\n", + " unitname score \n", + "itemid \n", + "223766 mmHg 110.0 \n", + "228149 mmHg 110.0 \n", + "224151 mmHg 110.0 \n", + "224643 mmHg 110.0 \n", + "224654 mmHg 110.0 \n", + "226855 mmHg 110.0 \n", + "226857 mmHg 110.0 \n", + "224646 mmHg 110.0 \n", + "227716 mmHg 110.0 \n", + "227717 mmHg 110.0 \n", + "224645 mmHg 110.0 \n", + "227242 mmHg 110.0 \n", + "226766 mmHg 110.0 \n", + "227243 mmHg 110.0 \n", + "226853 mmHg 110.0 \n", + "226849 mmHg 110.0 \n", + "226850 mmHg 110.0 \n", + "226851 mmHg 110.0 \n", + "224659 mmHg 110.0 \n", + "226854 mmHg 110.0 " + ] + }, + "execution_count": 71, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [220050]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [220051]\n", + "out_df.iloc[60:80]" + ] + }, + { + "cell_type": "code", + "execution_count": 72, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>228158</th>\n", + " <td>Purge Pressure</td>\n", + " <td>Purge Pressure</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226852</th>\n", + " <td>PA systolic pressure(PA Line)</td>\n", + " <td>PA systolic pressure(PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224652</th>\n", + " <td>Unassisted Systole</td>\n", + " <td>SYS - Unassisted</td>\n", + " <td>chartevents</td>\n", + " <td>IABP</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7643</th>\n", + " <td>RVSYSTOLIC</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>102.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8441</th>\n", + " <td>NBP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8364</th>\n", + " <td>ABP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8448</th>\n", + " <td>PAP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>455</th>\n", + " <td>NBP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>ABP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>492</th>\n", + " <td>PAP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8508</th>\n", + " <td>BP UAC [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>89.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8505</th>\n", + " <td>BP PAL [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>89.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3319</th>\n", + " <td>BP PAL [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3325</th>\n", + " <td>BP UAC [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8502</th>\n", + " <td>BP Cuff [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>87.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3313</th>\n", + " <td>BP Cuff [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>86.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>153</th>\n", + " <td>Diastolic Unloading</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>86.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227539</th>\n", + " <td>ART Blood Pressure Alarm Source</td>\n", + " <td>ART BP Alarm Source</td>\n", + " <td></td>\n", + " <td>Alarms</td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8440</th>\n", + " <td>Manual BP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>666</th>\n", + " <td>Systolic Unloading</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "228158 Purge Pressure Purge Pressure \n", + "226852 PA systolic pressure(PA Line) PA systolic pressure(PA Line) \n", + "224652 Unassisted Systole SYS - Unassisted \n", + "7643 RVSYSTOLIC \n", + "8441 NBP [Diastolic] \n", + "8364 ABP [Diastolic] \n", + "8448 PAP [Diastolic] \n", + "455 NBP [Systolic] \n", + "6 ABP [Systolic] \n", + "492 PAP [Systolic] \n", + "8508 BP UAC [Diastolic] \n", + "8505 BP PAL [Diastolic] \n", + "3319 BP PAL [Systolic] \n", + "3325 BP UAC [Systolic] \n", + "8502 BP Cuff [Diastolic] \n", + "3313 BP Cuff [Systolic] \n", + "153 Diastolic Unloading \n", + "227539 ART Blood Pressure Alarm Source ART BP Alarm Source \n", + "8440 Manual BP [Diastolic] \n", + "666 Systolic Unloading \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "228158 chartevents Impella mmHg 110.000000 \n", + "226852 chartevents PA Line Insertion mmHg 110.000000 \n", + "224652 chartevents IABP mmHg 110.000000 \n", + "7643 chartevents 102.666667 \n", + "8441 chartevents 95.666667 \n", + "8364 chartevents 95.666667 \n", + "8448 chartevents 95.666667 \n", + "455 chartevents 94.333333 \n", + "6 chartevents 94.333333 \n", + "492 chartevents 94.333333 \n", + "8508 chartevents 89.666667 \n", + "8505 chartevents 89.666667 \n", + "3319 chartevents 88.000000 \n", + "3325 chartevents 88.000000 \n", + "8502 chartevents 87.666667 \n", + "3313 chartevents 86.333333 \n", + "153 chartevents 86.000000 \n", + "227539 Alarms 84.666667 \n", + "8440 chartevents 84.666667 \n", + "666 chartevents 84.666667 " + ] + }, + "execution_count": 72, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [227243]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [227242]\n", + "out_df.iloc[80:100]" + ] + }, + { + "cell_type": "code", + "execution_count": 73, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>6417</th>\n", + " <td>low pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7133</th>\n", + " <td>abd pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6944</th>\n", + " <td>LOW PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2027</th>\n", + " <td>Low pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6107</th>\n", + " <td>Low Pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>442</th>\n", + " <td>Manual BP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>83.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8503</th>\n", + " <td>BP Left Arm [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8504</th>\n", + " <td>BP Left Leg [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8368</th>\n", + " <td>Arterial BP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8506</th>\n", + " <td>BP Right Arm [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8507</th>\n", + " <td>BP Right Leg [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51</th>\n", + " <td>Arterial BP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3315</th>\n", + " <td>BP Left Arm [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3317</th>\n", + " <td>BP Left Leg [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3321</th>\n", + " <td>BP Right Arm [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3323</th>\n", + " <td>BP Right Leg [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8555</th>\n", + " <td>Arterial BP #2 [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>29</th>\n", + " <td>Access mmHg</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44560</th>\n", + " <td>blood</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>70015</th>\n", + " <td>BLOOD</td>\n", + " <td></td>\n", + " <td>microbiologyevents</td>\n", + " <td>SPECIMEN</td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto category \\\n", + "itemid \n", + "6417 low pressure chartevents \n", + "7133 abd pressure chartevents \n", + "6944 LOW PRESSURE chartevents \n", + "2027 Low pressure chartevents \n", + "6107 Low Pressure chartevents \n", + "442 Manual BP [Systolic] chartevents \n", + "8503 BP Left Arm [Diastolic] chartevents \n", + "8504 BP Left Leg [Diastolic] chartevents \n", + "8368 Arterial BP [Diastolic] chartevents \n", + "8506 BP Right Arm [Diastolic] chartevents \n", + "8507 BP Right Leg [Diastolic] chartevents \n", + "51 Arterial BP [Systolic] chartevents \n", + "3315 BP Left Arm [Systolic] chartevents \n", + "3317 BP Left Leg [Systolic] chartevents \n", + "3321 BP Right Arm [Systolic] chartevents \n", + "3323 BP Right Leg [Systolic] chartevents \n", + "8555 Arterial BP #2 [Diastolic] chartevents \n", + "29 Access mmHg chartevents \n", + "44560 blood inputevents_cv \n", + "70015 BLOOD microbiologyevents SPECIMEN \n", + "\n", + " unitname score \n", + "itemid \n", + "6417 84.333333 \n", + "7133 84.333333 \n", + "6944 84.333333 \n", + "2027 84.333333 \n", + "6107 84.333333 \n", + "442 83.000000 \n", + "8503 82.000000 \n", + "8504 82.000000 \n", + "8368 82.000000 \n", + "8506 81.000000 \n", + "8507 81.000000 \n", + "51 80.000000 \n", + "3315 80.000000 \n", + "3317 80.000000 \n", + "3321 79.000000 \n", + "3323 79.000000 \n", + "8555 79.000000 \n", + "29 78.666667 \n", + "44560 78.666667 \n", + "70015 78.666667 " + ] + }, + "execution_count": 73, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [455,6]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [8441,8364]\n", + "out_df.iloc[100:120]" + ] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>51466</th>\n", + " <td>BLOOD</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6127</th>\n", + " <td>LO Press</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46780</th>\n", + " <td>Bladdar pressure</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1404</th>\n", + " <td>Bladder pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>993</th>\n", + " <td>bladder pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6701</th>\n", + " <td>Arterial BP #2 [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1411</th>\n", + " <td>Bladder Pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>996</th>\n", + " <td>BLADDER PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44862</th>\n", + " <td>BLADDER PRESSURE</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>77.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>770</th>\n", + " <td>AST</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Enzymes</td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220587</th>\n", + " <td>AST</td>\n", + " <td>AST</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>None</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2347</th>\n", + " <td>BLADDER PRESSURE.</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6631</th>\n", + " <td>pressure low</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>75.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3108</th>\n", + " <td>PA PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>75.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7504</th>\n", + " <td>Driv pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>75.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2779</th>\n", + " <td>bladder pressures</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>75.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43763</th>\n", + " <td>Bladder presure</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>74.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1509</th>\n", + " <td>bld pres</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>73.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6540</th>\n", + " <td>IntraABd pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>73.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8444</th>\n", + " <td>Orthostat BP sitting [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>73.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "51466 BLOOD NaN labevents \n", + "6127 LO Press chartevents \n", + "46780 Bladdar pressure inputevents_cv \n", + "1404 Bladder pressure chartevents \n", + "993 bladder pressure chartevents \n", + "6701 Arterial BP #2 [Systolic] chartevents \n", + "1411 Bladder Pressure chartevents \n", + "996 BLADDER PRESSURE chartevents \n", + "44862 BLADDER PRESSURE inputevents_cv \n", + "770 AST chartevents \n", + "220587 AST AST chartevents \n", + "2347 BLADDER PRESSURE. chartevents \n", + "6631 pressure low chartevents \n", + "3108 PA PRESSURE chartevents \n", + "7504 Driv pressure chartevents \n", + "2779 bladder pressures chartevents \n", + "43763 Bladder presure inputevents_cv \n", + "1509 bld pres chartevents \n", + "6540 IntraABd pressure chartevents \n", + "8444 Orthostat BP sitting [Diastolic] chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "51466 HEMATOLOGY NaN 78.666667 \n", + "6127 78.000000 \n", + "46780 77.000000 \n", + "1404 77.000000 \n", + "993 77.000000 \n", + "6701 77.000000 \n", + "1411 77.000000 \n", + "996 77.000000 \n", + "44862 Free Form Intake 77.000000 \n", + "770 Enzymes 76.666667 \n", + "220587 Labs None 76.666667 \n", + "2347 76.000000 \n", + "6631 75.666667 \n", + "3108 75.333333 \n", + "7504 75.000000 \n", + "2779 75.000000 \n", + "43763 74.333333 \n", + "1509 73.666667 \n", + "6540 73.666667 \n", + "8444 73.333333 " + ] + }, + "execution_count": 74, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [3313]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [8502,8440]\n", + "out_df.iloc[120:140]" + ] + }, + { + "cell_type": "code", + "execution_count": 75, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>8446</th>\n", + " <td>Orthostatic BP lying [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>73.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8445</th>\n", + " <td>OrthostatBP standing [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>73.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6302</th>\n", + " <td>low press</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>72.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2562</th>\n", + " <td>INTRA ABD PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>72.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45682</th>\n", + " <td>bladder pressure in</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>72.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7124</th>\n", + " <td>Low pressure Alarm</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>72.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43744</th>\n", + " <td>NS bladder pressure</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>72.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228151</th>\n", + " <td>Aortic Pressure Signal - Diastolic</td>\n", + " <td>Aortic Pressure Signal - Diastolic</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>None</td>\n", + " <td>72.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42735</th>\n", + " <td>Intra-abd. Pressure</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>71.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>484</th>\n", + " <td>Orthostatic BP lying [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>482</th>\n", + " <td>OrthostatBP standing [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>480</th>\n", + " <td>Orthostat BP sitting [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44344</th>\n", + " <td>BLADDER PRESSURE FLD</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>71.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44187</th>\n", + " <td>Blood emesis</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>71.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3238</th>\n", + " <td>CSF PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>71.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2965</th>\n", + " <td>INTRAABDOM. PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>70.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228152</th>\n", + " <td>Aortic Pressure Signal - Systolic</td>\n", + " <td>Aortic Pressure Signal - Systolic</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>None</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50934</th>\n", + " <td>H</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7574</th>\n", + " <td>lumbar pressure</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>69.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2704</th>\n", + " <td>ABDOMINAL PRESSURE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>69.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label \\\n", + "itemid \n", + "8446 Orthostatic BP lying [Diastolic] \n", + "8445 OrthostatBP standing [Diastolic] \n", + "6302 low press \n", + "2562 INTRA ABD PRESSURE \n", + "45682 bladder pressure in \n", + "7124 Low pressure Alarm \n", + "43744 NS bladder pressure \n", + "228151 Aortic Pressure Signal - Diastolic \n", + "42735 Intra-abd. Pressure \n", + "484 Orthostatic BP lying [Systolic] \n", + "482 OrthostatBP standing [Systolic] \n", + "480 Orthostat BP sitting [Systolic] \n", + "44344 BLADDER PRESSURE FLD \n", + "44187 Blood emesis \n", + "3238 CSF PRESSURE \n", + "2965 INTRAABDOM. PRESSURE \n", + "228152 Aortic Pressure Signal - Systolic \n", + "50934 H \n", + "7574 lumbar pressure \n", + "2704 ABDOMINAL PRESSURE \n", + "\n", + " abbreviation linksto category \\\n", + "itemid \n", + "8446 chartevents \n", + "8445 chartevents \n", + "6302 chartevents \n", + "2562 chartevents \n", + "45682 inputevents_cv Free Form Intake \n", + "7124 chartevents \n", + "43744 inputevents_cv Free Form Intake \n", + "228151 Aortic Pressure Signal - Diastolic chartevents Impella \n", + "42735 inputevents_cv Free Form Intake \n", + "484 chartevents \n", + "482 chartevents \n", + "480 chartevents \n", + "44344 inputevents_cv Free Form Intake \n", + "44187 outputevents Free Form Intake \n", + "3238 chartevents \n", + "2965 chartevents \n", + "228152 Aortic Pressure Signal - Systolic chartevents Impella \n", + "50934 NaN labevents CHEMISTRY \n", + "7574 chartevents \n", + "2704 chartevents \n", + "\n", + " unitname score \n", + "itemid \n", + "8446 73.333333 \n", + "8445 73.333333 \n", + "6302 72.666667 \n", + "2562 72.333333 \n", + "45682 72.333333 \n", + "7124 72.333333 \n", + "43744 72.333333 \n", + "228151 None 72.000000 \n", + "42735 71.666667 \n", + "484 71.333333 \n", + "482 71.333333 \n", + "480 71.333333 \n", + "44344 71.000000 \n", + "44187 71.000000 \n", + "3238 71.000000 \n", + "2965 70.333333 \n", + "228152 None 70.000000 \n", + "50934 NaN 70.000000 \n", + "7574 69.666667 \n", + "2704 69.666667 " + ] + }, + "execution_count": 75, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [442,3315,51,3317]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [8368,8503,8504,8507,8506]\n", + "out_df.iloc[140:160]" + ] + }, + { + "cell_type": "code", + "execution_count": 76, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [3321,3323]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += [8555]\n", + "keep_dict[data_dict.labels.BLOOD_PRESSURE_MEAN] = [220181,225312,220052]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += [6701]" + ] + }, + { + "cell_type": "code", + "execution_count": 77, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>220179</th>\n", + " <td>Non Invasive Blood Pressure systolic</td>\n", + " <td>NBPs</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225309</th>\n", + " <td>ART BP Systolic</td>\n", + " <td>ART BP Systolic</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224167</th>\n", + " <td>Manual Blood Pressure Systolic Left</td>\n", + " <td>Manual BPs L</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220050</th>\n", + " <td>Arterial Blood Pressure systolic</td>\n", + " <td>ABPs</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227243</th>\n", + " <td>Manual Blood Pressure Systolic Right</td>\n", + " <td>Manual BPs R</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>455</th>\n", + " <td>NBP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>ABP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3313</th>\n", + " <td>BP Cuff [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>86.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>442</th>\n", + " <td>Manual BP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>83.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3315</th>\n", + " <td>BP Left Arm [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51</th>\n", + " <td>Arterial BP [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3317</th>\n", + " <td>BP Left Leg [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3321</th>\n", + " <td>BP Right Arm [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3323</th>\n", + " <td>BP Right Leg [Systolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "220179 Non Invasive Blood Pressure systolic NBPs chartevents \n", + "225309 ART BP Systolic ART BP Systolic chartevents \n", + "224167 Manual Blood Pressure Systolic Left Manual BPs L chartevents \n", + "220050 Arterial Blood Pressure systolic ABPs chartevents \n", + "227243 Manual Blood Pressure Systolic Right Manual BPs R chartevents \n", + "455 NBP [Systolic] chartevents \n", + "6 ABP [Systolic] chartevents \n", + "3313 BP Cuff [Systolic] chartevents \n", + "442 Manual BP [Systolic] chartevents \n", + "3315 BP Left Arm [Systolic] chartevents \n", + "51 Arterial BP [Systolic] chartevents \n", + "3317 BP Left Leg [Systolic] chartevents \n", + "3321 BP Right Arm [Systolic] chartevents \n", + "3323 BP Right Leg [Systolic] chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "220179 Routine Vital Signs mmHg 110.000000 \n", + "225309 Routine Vital Signs mmHg 110.000000 \n", + "224167 Routine Vital Signs mmHg 110.000000 \n", + "220050 Routine Vital Signs mmHg 110.000000 \n", + "227243 Routine Vital Signs mmHg 110.000000 \n", + "455 94.333333 \n", + "6 94.333333 \n", + "3313 86.333333 \n", + "442 83.000000 \n", + "3315 80.000000 \n", + "51 80.000000 \n", + "3317 80.000000 \n", + "3321 79.000000 \n", + "3323 79.000000 " + ] + }, + "execution_count": 77, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.loc[keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC]]" + ] + }, + { + "cell_type": "code", + "execution_count": 79, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>220180</th>\n", + " <td>Non Invasive Blood Pressure diastolic</td>\n", + " <td>NBPd</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225310</th>\n", + " <td>ART BP Diastolic</td>\n", + " <td>ART BP Diastolic</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224643</th>\n", + " <td>Manual Blood Pressure Diastolic Left</td>\n", + " <td>Manual BPd L</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220051</th>\n", + " <td>Arterial Blood Pressure diastolic</td>\n", + " <td>ABPd</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227242</th>\n", + " <td>Manual Blood Pressure Diastolic Right</td>\n", + " <td>Manual BPd R</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>mmHg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8441</th>\n", + " <td>NBP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8364</th>\n", + " <td>ABP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8502</th>\n", + " <td>BP Cuff [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>87.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8440</th>\n", + " <td>Manual BP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8368</th>\n", + " <td>Arterial BP [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8503</th>\n", + " <td>BP Left Arm [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8504</th>\n", + " <td>BP Left Leg [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8507</th>\n", + " <td>BP Right Leg [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8506</th>\n", + " <td>BP Right Arm [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8555</th>\n", + " <td>Arterial BP #2 [Diastolic]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "220180 Non Invasive Blood Pressure diastolic NBPd chartevents \n", + "225310 ART BP Diastolic ART BP Diastolic chartevents \n", + "224643 Manual Blood Pressure Diastolic Left Manual BPd L chartevents \n", + "220051 Arterial Blood Pressure diastolic ABPd chartevents \n", + "227242 Manual Blood Pressure Diastolic Right Manual BPd R chartevents \n", + "8441 NBP [Diastolic] chartevents \n", + "8364 ABP [Diastolic] chartevents \n", + "8502 BP Cuff [Diastolic] chartevents \n", + "8440 Manual BP [Diastolic] chartevents \n", + "8368 Arterial BP [Diastolic] chartevents \n", + "8503 BP Left Arm [Diastolic] chartevents \n", + "8504 BP Left Leg [Diastolic] chartevents \n", + "8507 BP Right Leg [Diastolic] chartevents \n", + "8506 BP Right Arm [Diastolic] chartevents \n", + "8555 Arterial BP #2 [Diastolic] chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "220180 Routine Vital Signs mmHg 110.000000 \n", + "225310 Routine Vital Signs mmHg 110.000000 \n", + "224643 Routine Vital Signs mmHg 110.000000 \n", + "220051 Routine Vital Signs mmHg 110.000000 \n", + "227242 Routine Vital Signs mmHg 110.000000 \n", + "8441 95.666667 \n", + "8364 95.666667 \n", + "8502 87.666667 \n", + "8440 84.666667 \n", + "8368 82.000000 \n", + "8503 82.000000 \n", + "8504 82.000000 \n", + "8507 81.000000 \n", + "8506 81.000000 \n", + "8555 79.000000 " + ] + }, + "execution_count": 79, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.loc[keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC]]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### O2 Sat" + ] + }, + { + "cell_type": "code", + "execution_count": 80, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>50817</th>\n", + " <td>OXYGEN SATURATION</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220277</th>\n", + " <td>O2 saturation pulseoxymetry</td>\n", + " <td>SpO2</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>%</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>646</th>\n", + " <td>SpO2</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228232</th>\n", + " <td>PAR-Oxygen saturation</td>\n", + " <td>PAR-Oxygen saturation</td>\n", + " <td></td>\n", + " <td>Routine Vital Signs</td>\n", + " <td></td>\n", + " <td>102.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3785</th>\n", + " <td>PO2</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>ABG's</td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3837</th>\n", + " <td>pO2</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>ABG'S</td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50821</th>\n", + " <td>PO2</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6719</th>\n", + " <td>SpO2-L</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1341</th>\n", + " <td>PULSE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1725</th>\n", + " <td>Pulse</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1332</th>\n", + " <td>pulse</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50816</th>\n", + " <td>OXYGEN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2955</th>\n", + " <td>JVO2 SAT</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2574</th>\n", + " <td>MVO2 SAT</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227873</th>\n", + " <td>Recovery O2 Sat - Aerobic Capacity</td>\n", + " <td>Recovery O2 Sat - Aerobic Capacity</td>\n", + " <td>chartevents</td>\n", + " <td>OT Notes</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223772</th>\n", + " <td>SvO2</td>\n", + " <td>SvO2</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223769</th>\n", + " <td>O2 Saturation Pulseoxymetry Alarm - High</td>\n", + " <td>SpO2 Alarm - High</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227867</th>\n", + " <td>Activity O2 Sat - Aerobic Capacity</td>\n", + " <td>Activity O2 Sat - Aerobic Capacity</td>\n", + " <td>chartevents</td>\n", + " <td>OT Notes</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223770</th>\n", + " <td>O2 Saturation Pulseoxymetry Alarm - Low</td>\n", + " <td>SpO2 Alarm - Low</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226861</th>\n", + " <td>ART %O2 saturation (PA Line)</td>\n", + " <td>ART %O2 saturation (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225674</th>\n", + " <td>Mixed Venous O2% Sat</td>\n", + " <td>Mixed Venous O2% Sat</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226862</th>\n", + " <td>PA %O2 Saturation (PA Line)</td>\n", + " <td>PA %O2 Saturation (PA Line)</td>\n", + " <td>chartevents</td>\n", + " <td>PA Line Insertion</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227686</th>\n", + " <td>Central Venous O2% Sat</td>\n", + " <td>Central Venous O2% Sat</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227546</th>\n", + " <td>SVV (Arterial)</td>\n", + " <td>SVV (Arterial)</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227549</th>\n", + " <td>ScvO2 (Presep)</td>\n", + " <td>ScvO2 (Presep)</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226993</th>\n", + " <td>ApacheIV_LOS</td>\n", + " <td>ApacheIV_LOS</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227008</th>\n", + " <td>Ejection Fraction</td>\n", + " <td>Ejection Fraction</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227010</th>\n", + " <td>FiO2_ApacheIV</td>\n", + " <td>FiO2_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226272</th>\n", + " <td>EF (CCO)</td>\n", + " <td>EF (CCO)</td>\n", + " <td>chartevents</td>\n", + " <td>Hemodynamics</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228184</th>\n", + " <td>SVV (PiCCO)</td>\n", + " <td>SVV (PiCCO)</td>\n", + " <td>chartevents</td>\n", + " <td>PiCCO</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227861</th>\n", + " <td>Rest O2 Sat - Aerobic Capacity</td>\n", + " <td>Rest O2 Sat - Aerobic Capacity</td>\n", + " <td>chartevents</td>\n", + " <td>OT Notes</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226253</th>\n", + " <td>SpO2 Desat Limit</td>\n", + " <td>SpO2 Desat Limit</td>\n", + " <td>chartevents</td>\n", + " <td>Alarms</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224704</th>\n", + " <td>ATC %</td>\n", + " <td>ATC %</td>\n", + " <td>chartevents</td>\n", + " <td>Respiratory</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228378</th>\n", + " <td>TFCd (NICOM)</td>\n", + " <td>TFCd (NICOM)</td>\n", + " <td>chartevents</td>\n", + " <td>NICOM</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226745</th>\n", + " <td>APACHE II Predecited Death Rate</td>\n", + " <td>APACHE II PDR</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227919</th>\n", + " <td>Rest O2 Sat - Aerobic Activity Response</td>\n", + " <td>Rest O2 Sat - Aerobic Activity Response</td>\n", + " <td>chartevents</td>\n", + " <td>OT Notes</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226744</th>\n", + " <td>APACHE II PDR - Adjusted</td>\n", + " <td>APACHE II PDR - Adjusted</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228377</th>\n", + " <td>SVI Change</td>\n", + " <td>SVI Change</td>\n", + " <td>chartevents</td>\n", + " <td>NICOM</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226754</th>\n", + " <td>FiO2ApacheIIValue</td>\n", + " <td>FiO2ApacheIIValue</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228375</th>\n", + " <td>Stroke Volume Index (SVI NICOM)</td>\n", + " <td>Stroke Volume Index (SVI NICOM)</td>\n", + " <td>chartevents</td>\n", + " <td>NICOM</td>\n", + " <td>%</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label \\\n", + "itemid \n", + "50817 OXYGEN SATURATION \n", + "220277 O2 saturation pulseoxymetry \n", + "646 SpO2 \n", + "228232 PAR-Oxygen saturation \n", + "3785 PO2 \n", + "3837 pO2 \n", + "50821 PO2 \n", + "6719 SpO2-L \n", + "1341 PULSE \n", + "1725 Pulse \n", + "1332 pulse \n", + "50816 OXYGEN \n", + "2955 JVO2 SAT \n", + "2574 MVO2 SAT \n", + "227873 Recovery O2 Sat - Aerobic Capacity \n", + "223772 SvO2 \n", + "223769 O2 Saturation Pulseoxymetry Alarm - High \n", + "227867 Activity O2 Sat - Aerobic Capacity \n", + "223770 O2 Saturation Pulseoxymetry Alarm - Low \n", + "226861 ART %O2 saturation (PA Line) \n", + "225674 Mixed Venous O2% Sat \n", + "226862 PA %O2 Saturation (PA Line) \n", + "227686 Central Venous O2% Sat \n", + "227546 SVV (Arterial) \n", + "227549 ScvO2 (Presep) \n", + "226993 ApacheIV_LOS \n", + "227008 Ejection Fraction \n", + "227010 FiO2_ApacheIV \n", + "226272 EF (CCO) \n", + "228184 SVV (PiCCO) \n", + "227861 Rest O2 Sat - Aerobic Capacity \n", + "226253 SpO2 Desat Limit \n", + "224704 ATC % \n", + "228378 TFCd (NICOM) \n", + "226745 APACHE II Predecited Death Rate \n", + "227919 Rest O2 Sat - Aerobic Activity Response \n", + "226744 APACHE II PDR - Adjusted \n", + "228377 SVI Change \n", + "226754 FiO2ApacheIIValue \n", + "228375 Stroke Volume Index (SVI NICOM) \n", + "\n", + " abbreviation linksto \\\n", + "itemid \n", + "50817 NaN labevents \n", + "220277 SpO2 chartevents \n", + "646 chartevents \n", + "228232 PAR-Oxygen saturation \n", + "3785 chartevents \n", + "3837 chartevents \n", + "50821 NaN labevents \n", + "6719 chartevents \n", + "1341 chartevents \n", + "1725 chartevents \n", + "1332 chartevents \n", + "50816 NaN labevents \n", + "2955 chartevents \n", + "2574 chartevents \n", + "227873 Recovery O2 Sat - Aerobic Capacity chartevents \n", + "223772 SvO2 chartevents \n", + "223769 SpO2 Alarm - High chartevents \n", + "227867 Activity O2 Sat - Aerobic Capacity chartevents \n", + "223770 SpO2 Alarm - Low chartevents \n", + "226861 ART %O2 saturation (PA Line) chartevents \n", + "225674 Mixed Venous O2% Sat chartevents \n", + "226862 PA %O2 Saturation (PA Line) chartevents \n", + "227686 Central Venous O2% Sat chartevents \n", + "227546 SVV (Arterial) chartevents \n", + "227549 ScvO2 (Presep) chartevents \n", + "226993 ApacheIV_LOS chartevents \n", + "227008 Ejection Fraction chartevents \n", + "227010 FiO2_ApacheIV chartevents \n", + "226272 EF (CCO) chartevents \n", + "228184 SVV (PiCCO) chartevents \n", + "227861 Rest O2 Sat - Aerobic Capacity chartevents \n", + "226253 SpO2 Desat Limit chartevents \n", + "224704 ATC % chartevents \n", + "228378 TFCd (NICOM) chartevents \n", + "226745 APACHE II PDR chartevents \n", + "227919 Rest O2 Sat - Aerobic Activity Response chartevents \n", + "226744 APACHE II PDR - Adjusted chartevents \n", + "228377 SVI Change chartevents \n", + "226754 FiO2ApacheIIValue chartevents \n", + "228375 Stroke Volume Index (SVI NICOM) chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "50817 BLOOD GAS NaN 110.000000 \n", + "220277 Respiratory % 110.000000 \n", + "646 110.000000 \n", + "228232 Routine Vital Signs 102.666667 \n", + "3785 ABG's 100.666667 \n", + "3837 ABG'S 100.666667 \n", + "50821 BLOOD GAS NaN 100.666667 \n", + "6719 96.666667 \n", + "1341 78.666667 \n", + "1725 78.666667 \n", + "1332 78.666667 \n", + "50816 BLOOD GAS NaN 78.000000 \n", + "2955 78.000000 \n", + "2574 78.000000 \n", + "227873 OT Notes % 76.666667 \n", + "223772 Hemodynamics % 76.666667 \n", + "223769 Alarms % 76.666667 \n", + "227867 OT Notes % 76.666667 \n", + "223770 Alarms % 76.666667 \n", + "226861 PA Line Insertion % 76.666667 \n", + "225674 Labs % 76.666667 \n", + "226862 PA Line Insertion % 76.666667 \n", + "227686 Labs % 76.666667 \n", + "227546 Hemodynamics % 76.666667 \n", + "227549 Hemodynamics % 76.666667 \n", + "226993 Scores - APACHE IV (2) % 76.666667 \n", + "227008 Scores - APACHE IV (2) % 76.666667 \n", + "227010 Scores - APACHE IV (2) % 76.666667 \n", + "226272 Hemodynamics % 76.666667 \n", + "228184 PiCCO % 76.666667 \n", + "227861 OT Notes % 76.666667 \n", + "226253 Alarms % 76.666667 \n", + "224704 Respiratory % 76.666667 \n", + "228378 NICOM % 76.666667 \n", + "226745 Scores - APACHE II % 76.666667 \n", + "227919 OT Notes % 76.666667 \n", + "226744 Scores - APACHE II % 76.666667 \n", + "228377 NICOM % 76.666667 \n", + "226754 Scores - APACHE II % 76.666667 \n", + "228375 NICOM % 76.666667 " + ] + }, + "execution_count": 80, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'oxygen saturation',\n", + " 'O2sat',\n", + " 'pulse oximetry',\n", + " '%',\n", + " 'spo2'\n", + " ])\n", + "out_df.head(40)" + ] + }, + { + "cell_type": "code", + "execution_count": 81, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.OXYGEN_SATURATION_PULSE_OXIMETRY] = [646,220277,228232]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Body Temp" + ] + }, + { + "cell_type": "code", + "execution_count": 82, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>50825</th>\n", + " <td>TEMPERATURE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226170</th>\n", + " <td>Head of Bead Measurement</td>\n", + " <td>HOB Measurement</td>\n", + " <td>chartevents</td>\n", + " <td>Treatments</td>\n", + " <td>Degree</td>\n", + " <td>104.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223762</th>\n", + " <td>Temperature Celsius</td>\n", + " <td>Temperature C</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>?C</td>\n", + " <td>104.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223761</th>\n", + " <td>Temperature Fahrenheit</td>\n", + " <td>Temperature F</td>\n", + " <td>chartevents</td>\n", + " <td>Routine Vital Signs</td>\n", + " <td>?F</td>\n", + " <td>104.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>678</th>\n", + " <td>Temperature F</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>104.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>676</th>\n", + " <td>Temperature C</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>104.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>591</th>\n", + " <td>RLE [Temperature]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>597</th>\n", + " <td>RUE [Temperature]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224027</th>\n", + " <td>Skin Temperature</td>\n", + " <td>Skin Temp</td>\n", + " <td></td>\n", + " <td>Skin - Assessment</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224642</th>\n", + " <td>Temperature Site</td>\n", + " <td>Temp Site</td>\n", + " <td></td>\n", + " <td>Routine Vital Signs</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>645</th>\n", + " <td>Skin [Temperature]</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>679</th>\n", + " <td>Temperature F (calc)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>92.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>677</th>\n", + " <td>Temperature C (calc)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>92.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227054</th>\n", + " <td>TemperatureF_ApacheIV</td>\n", + " <td>TemperatureF_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>?F</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224769</th>\n", + " <td>LUE Temp</td>\n", + " <td>LUE Temp</td>\n", + " <td></td>\n", + " <td>Cardiovascular</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224771</th>\n", + " <td>RLE Temp</td>\n", + " <td>RLE Temp</td>\n", + " <td></td>\n", + " <td>Cardiovascular</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224773</th>\n", + " <td>LLE Temp</td>\n", + " <td>LLE Temp</td>\n", + " <td></td>\n", + " <td>Cardiovascular</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2798</th>\n", + " <td>arm 90 degrees</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224674</th>\n", + " <td>Changes in Temperature</td>\n", + " <td>Changes in Temperature</td>\n", + " <td></td>\n", + " <td>Toxicology</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224767</th>\n", + " <td>RUE Temp</td>\n", + " <td>RUE Temp</td>\n", + " <td></td>\n", + " <td>Cardiovascular</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "50825 TEMPERATURE NaN labevents \n", + "226170 Head of Bead Measurement HOB Measurement chartevents \n", + "223762 Temperature Celsius Temperature C chartevents \n", + "223761 Temperature Fahrenheit Temperature F chartevents \n", + "678 Temperature F chartevents \n", + "676 Temperature C chartevents \n", + "591 RLE [Temperature] chartevents \n", + "597 RUE [Temperature] chartevents \n", + "224027 Skin Temperature Skin Temp \n", + "224642 Temperature Site Temp Site \n", + "645 Skin [Temperature] chartevents \n", + "679 Temperature F (calc) chartevents \n", + "677 Temperature C (calc) chartevents \n", + "227054 TemperatureF_ApacheIV TemperatureF_ApacheIV chartevents \n", + "224769 LUE Temp LUE Temp \n", + "224771 RLE Temp RLE Temp \n", + "224773 LLE Temp LLE Temp \n", + "2798 arm 90 degrees chartevents \n", + "224674 Changes in Temperature Changes in Temperature \n", + "224767 RUE Temp RUE Temp \n", + "\n", + " category unitname score \n", + "itemid \n", + "50825 BLOOD GAS NaN 110.000000 \n", + "226170 Treatments Degree 104.666667 \n", + "223762 Routine Vital Signs ?C 104.666667 \n", + "223761 Routine Vital Signs ?F 104.666667 \n", + "678 104.666667 \n", + "676 104.666667 \n", + "591 98.000000 \n", + "597 98.000000 \n", + "224027 Skin - Assessment 97.333333 \n", + "224642 Routine Vital Signs 97.333333 \n", + "645 95.666667 \n", + "679 92.333333 \n", + "677 92.333333 \n", + "227054 Scores - APACHE IV (2) ?F 89.333333 \n", + "224769 Cardiovascular 88.000000 \n", + "224771 Cardiovascular 88.000000 \n", + "224773 Cardiovascular 88.000000 \n", + "2798 88.000000 \n", + "224674 Toxicology 88.000000 \n", + "224767 Cardiovascular 88.000000 " + ] + }, + "execution_count": 82, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'temperature',\n", + " 'temp',\n", + " 'celcius',\n", + " 'farenheit',\n", + " 'degrees',\n", + " 'deg'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 83, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.TEMPERATURE_BODY] = [223761,678,223762,676]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Weight" + ] + }, + { + "cell_type": "code", + "execution_count": 97, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>763</th>\n", + " <td>Daily Weight</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226512</th>\n", + " <td>Admission Weight (Kg)</td>\n", + " <td>Admission Weight (Kg)</td>\n", + " <td>chartevents</td>\n", + " <td>General</td>\n", + " <td>kg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226846</th>\n", + " <td>Feeding Weight</td>\n", + " <td>Feeding Weight</td>\n", + " <td>chartevents</td>\n", + " <td>General</td>\n", + " <td>kg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224639</th>\n", + " <td>Daily Weight</td>\n", + " <td>Daily Weight</td>\n", + " <td>chartevents</td>\n", + " <td>General</td>\n", + " <td>kg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3693</th>\n", + " <td>Weight Kg</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>968</th>\n", + " <td>EKG</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225402</th>\n", + " <td>EKG</td>\n", + " <td>EKG</td>\n", + " <td>procedureevents_mv</td>\n", + " <td>4-Procedures</td>\n", + " <td>None</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226184</th>\n", + " <td>Estimated Protein Needs/Kg</td>\n", + " <td>Estimated Protein Needs/Kg</td>\n", + " <td>chartevents</td>\n", + " <td>General</td>\n", + " <td>g/kg</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>733</th>\n", + " <td>Weight Change</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>85.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226707</th>\n", + " <td>Height</td>\n", + " <td>Height</td>\n", + " <td>chartevents</td>\n", + " <td>General</td>\n", + " <td>Inch</td>\n", + " <td>83.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4183</th>\n", + " <td>Birthweight (kg)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228179</th>\n", + " <td>ELWI (PiCCO)</td>\n", + " <td>ELWI (PiCCO)</td>\n", + " <td>chartevents</td>\n", + " <td>PiCCO</td>\n", + " <td>ml/kg</td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>580</th>\n", + " <td>Previous Weight</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43622</th>\n", + " <td>cc/kg</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>581</th>\n", + " <td>Previous WeightF</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7000</th>\n", + " <td>ideal body weight</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45271</th>\n", + " <td>Chucks Pad Weight</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3723</th>\n", + " <td>Birth Weight (kg)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3581</th>\n", + " <td>Present Weight (lb)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3692</th>\n", + " <td>Weight Change (gms)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "763 Daily Weight \n", + "226512 Admission Weight (Kg) Admission Weight (Kg) \n", + "226846 Feeding Weight Feeding Weight \n", + "224639 Daily Weight Daily Weight \n", + "3693 Weight Kg \n", + "968 EKG \n", + "225402 EKG EKG \n", + "226184 Estimated Protein Needs/Kg Estimated Protein Needs/Kg \n", + "733 Weight Change \n", + "226707 Height Height \n", + "4183 Birthweight (kg) \n", + "228179 ELWI (PiCCO) ELWI (PiCCO) \n", + "580 Previous Weight \n", + "43622 cc/kg \n", + "581 Previous WeightF \n", + "7000 ideal body weight \n", + "45271 Chucks Pad Weight \n", + "3723 Birth Weight (kg) \n", + "3581 Present Weight (lb) \n", + "3692 Weight Change (gms) \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "763 chartevents 110.000000 \n", + "226512 chartevents General kg 110.000000 \n", + "226846 chartevents General kg 110.000000 \n", + "224639 chartevents General kg 110.000000 \n", + "3693 chartevents 96.666667 \n", + "968 chartevents 96.666667 \n", + "225402 procedureevents_mv 4-Procedures None 96.666667 \n", + "226184 chartevents General g/kg 88.000000 \n", + "733 chartevents 85.333333 \n", + "226707 chartevents General Inch 83.000000 \n", + "4183 chartevents 81.666667 \n", + "228179 chartevents PiCCO ml/kg 81.333333 \n", + "580 chartevents 81.333333 \n", + "43622 inputevents_cv 81.333333 \n", + "581 chartevents 80.000000 \n", + "7000 chartevents 78.000000 \n", + "45271 inputevents_cv 78.000000 \n", + "3723 chartevents 77.666667 \n", + "3581 chartevents 76.000000 \n", + "3692 chartevents 76.000000 " + ] + }, + "execution_count": 97, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'weight',\n", + " 'daily weight',\n", + " 'kg' \n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 98, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.WEIGHT_BODY] =[763,224639,3693]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Urine Output" + ] + }, + { + "cell_type": "code", + "execution_count": 84, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>226560</th>\n", + " <td>Void</td>\n", + " <td>Void</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43332</th>\n", + " <td>void</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7672</th>\n", + " <td>Foley</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3686</th>\n", + " <td>Void</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45967</th>\n", + " <td>foley</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43053</th>\n", + " <td>URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226559</th>\n", + " <td>Foley</td>\n", + " <td>Foley</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44103</th>\n", + " <td>ER urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44834</th>\n", + " <td>er urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227519</th>\n", + " <td>Urine output_ApacheIV</td>\n", + " <td>Urine output</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>None</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44706</th>\n", + " <td>urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42892</th>\n", + " <td>EW URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45415</th>\n", + " <td>ED Urine OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43987</th>\n", + " <td>urine out or</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42666</th>\n", + " <td>E.R. URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44237</th>\n", + " <td>E.R. urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42592</th>\n", + " <td>VICU URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40069</th>\n", + " <td>Urine Out Void</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46423</th>\n", + " <td>ed foley</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43931</th>\n", + " <td>Floor urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "226560 Void Void outputevents \n", + "43332 void inputevents_cv \n", + "7672 Foley chartevents \n", + "3686 Void chartevents \n", + "45967 foley inputevents_cv \n", + "43053 URINE OUT outputevents \n", + "226559 Foley Foley outputevents \n", + "44103 ER urine out outputevents \n", + "44834 er urine out outputevents \n", + "227519 Urine output_ApacheIV Urine output chartevents \n", + "44706 urine output outputevents \n", + "42892 EW URINE OUT outputevents \n", + "45415 ED Urine OUT outputevents \n", + "43987 urine out or outputevents \n", + "42666 E.R. URINE OUT outputevents \n", + "44237 E.R. urine out outputevents \n", + "42592 VICU URINE OUT outputevents \n", + "40069 Urine Out Void outputevents \n", + "46423 ed foley inputevents_cv \n", + "43931 Floor urine out outputevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "226560 Output mL 110.000000 \n", + "43332 110.000000 \n", + "7672 110.000000 \n", + "3686 110.000000 \n", + "45967 110.000000 \n", + "43053 110.000000 \n", + "226559 Output mL 110.000000 \n", + "44103 100.666667 \n", + "44834 100.666667 \n", + "227519 Scores - APACHE IV (2) None 100.666667 \n", + "44706 100.666667 \n", + "42892 100.666667 \n", + "45415 100.666667 \n", + "43987 100.666667 \n", + "42666 96.666667 \n", + "44237 96.666667 \n", + "42592 95.333333 \n", + "40069 95.333333 \n", + "46423 94.666667 \n", + "43931 93.333333 " + ] + }, + "execution_count": 84, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'urine out',\n", + " 'void',\n", + " 'foley'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 85, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>226560</th>\n", + " <td>Void</td>\n", + " <td>Void</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43332</th>\n", + " <td>void</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7672</th>\n", + " <td>Foley</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3686</th>\n", + " <td>Void</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45967</th>\n", + " <td>foley</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43053</th>\n", + " <td>URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226559</th>\n", + " <td>Foley</td>\n", + " <td>Foley</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44103</th>\n", + " <td>ER urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44834</th>\n", + " <td>er urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227519</th>\n", + " <td>Urine output_ApacheIV</td>\n", + " <td>Urine output</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>None</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44706</th>\n", + " <td>urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42892</th>\n", + " <td>EW URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45415</th>\n", + " <td>ED Urine OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43987</th>\n", + " <td>urine out or</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42666</th>\n", + " <td>E.R. URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44237</th>\n", + " <td>E.R. urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42592</th>\n", + " <td>VICU URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40069</th>\n", + " <td>Urine Out Void</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46423</th>\n", + " <td>ed foley</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>94.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43931</th>\n", + " <td>Floor urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43348</th>\n", + " <td>urine output/kg</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40405</th>\n", + " <td>Urine Out Other</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42810</th>\n", + " <td>angio urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46180</th>\n", + " <td>urine out-angio</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40055</th>\n", + " <td>Urine Out Foley</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44253</th>\n", + " <td>Urine out angio</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44325</th>\n", + " <td>ED URINE OUTPUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41857</th>\n", + " <td>urine out in er</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44824</th>\n", + " <td>EW urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45991</th>\n", + " <td>ew-urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42042</th>\n", + " <td>ANGIO URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46177</th>\n", + " <td>URINE OUT-ANGIO</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44684</th>\n", + " <td>floor urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46658</th>\n", + " <td>ED Urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46578</th>\n", + " <td>URINE OUTPUT-ER</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42765</th>\n", + " <td>FARR 6 URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>91.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>70081</th>\n", + " <td>URINE</td>\n", + " <td></td>\n", + " <td>microbiologyevents</td>\n", + " <td>SPECIMEN</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3819</th>\n", + " <td>Urine Leukocytes</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>70079</th>\n", + " <td>URINE</td>\n", + " <td></td>\n", + " <td>microbiologyevents</td>\n", + " <td>SPECIMEN</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43462</th>\n", + " <td>urine</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "226560 Void Void outputevents \n", + "43332 void inputevents_cv \n", + "7672 Foley chartevents \n", + "3686 Void chartevents \n", + "45967 foley inputevents_cv \n", + "43053 URINE OUT outputevents \n", + "226559 Foley Foley outputevents \n", + "44103 ER urine out outputevents \n", + "44834 er urine out outputevents \n", + "227519 Urine output_ApacheIV Urine output chartevents \n", + "44706 urine output outputevents \n", + "42892 EW URINE OUT outputevents \n", + "45415 ED Urine OUT outputevents \n", + "43987 urine out or outputevents \n", + "42666 E.R. URINE OUT outputevents \n", + "44237 E.R. urine out outputevents \n", + "42592 VICU URINE OUT outputevents \n", + "40069 Urine Out Void outputevents \n", + "46423 ed foley inputevents_cv \n", + "43931 Floor urine out outputevents \n", + "43348 urine output/kg outputevents \n", + "40405 Urine Out Other outputevents \n", + "42810 angio urine out outputevents \n", + "46180 urine out-angio outputevents \n", + "40055 Urine Out Foley outputevents \n", + "44253 Urine out angio outputevents \n", + "44325 ED URINE OUTPUT outputevents \n", + "41857 urine out in er outputevents \n", + "44824 EW urine output outputevents \n", + "45991 ew-urine output outputevents \n", + "42042 ANGIO URINE OUT outputevents \n", + "46177 URINE OUT-ANGIO outputevents \n", + "44684 floor urine out outputevents \n", + "46658 ED Urine output outputevents \n", + "46578 URINE OUTPUT-ER outputevents \n", + "42765 FARR 6 URINE OUT outputevents \n", + "70081 URINE microbiologyevents \n", + "3819 Urine Leukocytes chartevents \n", + "70079 URINE microbiologyevents \n", + "43462 urine outputevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "226560 Output mL 110.000000 \n", + "43332 110.000000 \n", + "7672 110.000000 \n", + "3686 110.000000 \n", + "45967 110.000000 \n", + "43053 110.000000 \n", + "226559 Output mL 110.000000 \n", + "44103 100.666667 \n", + "44834 100.666667 \n", + "227519 Scores - APACHE IV (2) None 100.666667 \n", + "44706 100.666667 \n", + "42892 100.666667 \n", + "45415 100.666667 \n", + "43987 100.666667 \n", + "42666 96.666667 \n", + "44237 96.666667 \n", + "42592 95.333333 \n", + "40069 95.333333 \n", + "46423 94.666667 \n", + "43931 93.333333 \n", + "43348 93.333333 \n", + "40405 93.333333 \n", + "42810 93.333333 \n", + "46180 93.333333 \n", + "40055 93.333333 \n", + "44253 93.333333 \n", + "44325 93.333333 \n", + "41857 93.333333 \n", + "44824 93.333333 \n", + "45991 93.333333 \n", + "42042 93.333333 \n", + "46177 93.333333 \n", + "44684 93.333333 \n", + "46658 93.333333 \n", + "46578 93.333333 \n", + "42765 91.333333 \n", + "70081 SPECIMEN 90.666667 \n", + "3819 Urine 90.666667 \n", + "70079 SPECIMEN 90.666667 \n", + "43462 90.666667 " + ] + }, + "execution_count": 85, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.head(40)" + ] + }, + { + "cell_type": "code", + "execution_count": 86, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "out_df = out_df[out_df.linksto.isin(['outputevents','chartevents'])]" + ] + }, + { + "cell_type": "code", + "execution_count": 87, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>226560</th>\n", + " <td>Void</td>\n", + " <td>Void</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7672</th>\n", + " <td>Foley</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3686</th>\n", + " <td>Void</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43053</th>\n", + " <td>URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226559</th>\n", + " <td>Foley</td>\n", + " <td>Foley</td>\n", + " <td>outputevents</td>\n", + " <td>Output</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44103</th>\n", + " <td>ER urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44834</th>\n", + " <td>er urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227519</th>\n", + " <td>Urine output_ApacheIV</td>\n", + " <td>Urine output</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>None</td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44706</th>\n", + " <td>urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42892</th>\n", + " <td>EW URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45415</th>\n", + " <td>ED Urine OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43987</th>\n", + " <td>urine out or</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42666</th>\n", + " <td>E.R. URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44237</th>\n", + " <td>E.R. urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42592</th>\n", + " <td>VICU URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40069</th>\n", + " <td>Urine Out Void</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>95.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43931</th>\n", + " <td>Floor urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43348</th>\n", + " <td>urine output/kg</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40405</th>\n", + " <td>Urine Out Other</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42810</th>\n", + " <td>angio urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46180</th>\n", + " <td>urine out-angio</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40055</th>\n", + " <td>Urine Out Foley</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44253</th>\n", + " <td>Urine out angio</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44325</th>\n", + " <td>ED URINE OUTPUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41857</th>\n", + " <td>urine out in er</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44824</th>\n", + " <td>EW urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45991</th>\n", + " <td>ew-urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42042</th>\n", + " <td>ANGIO URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46177</th>\n", + " <td>URINE OUT-ANGIO</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44684</th>\n", + " <td>floor urine out</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46658</th>\n", + " <td>ED Urine output</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46578</th>\n", + " <td>URINE OUTPUT-ER</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>93.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42765</th>\n", + " <td>FARR 6 URINE OUT</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>91.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3819</th>\n", + " <td>Urine Leukocytes</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43462</th>\n", + " <td>urine</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3816</th>\n", + " <td>Urine Glucose</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3817</th>\n", + " <td>Urine Heme</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3818</th>\n", + " <td>Urine Ketones</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3822</th>\n", + " <td>Urine Protein</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Urine</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6298</th>\n", + " <td>foley d/c</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "226560 Void Void outputevents \n", + "7672 Foley chartevents \n", + "3686 Void chartevents \n", + "43053 URINE OUT outputevents \n", + "226559 Foley Foley outputevents \n", + "44103 ER urine out outputevents \n", + "44834 er urine out outputevents \n", + "227519 Urine output_ApacheIV Urine output chartevents \n", + "44706 urine output outputevents \n", + "42892 EW URINE OUT outputevents \n", + "45415 ED Urine OUT outputevents \n", + "43987 urine out or outputevents \n", + "42666 E.R. URINE OUT outputevents \n", + "44237 E.R. urine out outputevents \n", + "42592 VICU URINE OUT outputevents \n", + "40069 Urine Out Void outputevents \n", + "43931 Floor urine out outputevents \n", + "43348 urine output/kg outputevents \n", + "40405 Urine Out Other outputevents \n", + "42810 angio urine out outputevents \n", + "46180 urine out-angio outputevents \n", + "40055 Urine Out Foley outputevents \n", + "44253 Urine out angio outputevents \n", + "44325 ED URINE OUTPUT outputevents \n", + "41857 urine out in er outputevents \n", + "44824 EW urine output outputevents \n", + "45991 ew-urine output outputevents \n", + "42042 ANGIO URINE OUT outputevents \n", + "46177 URINE OUT-ANGIO outputevents \n", + "44684 floor urine out outputevents \n", + "46658 ED Urine output outputevents \n", + "46578 URINE OUTPUT-ER outputevents \n", + "42765 FARR 6 URINE OUT outputevents \n", + "3819 Urine Leukocytes chartevents \n", + "43462 urine outputevents \n", + "3816 Urine Glucose chartevents \n", + "3817 Urine Heme chartevents \n", + "3818 Urine Ketones chartevents \n", + "3822 Urine Protein chartevents \n", + "6298 foley d/c chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "226560 Output mL 110.000000 \n", + "7672 110.000000 \n", + "3686 110.000000 \n", + "43053 110.000000 \n", + "226559 Output mL 110.000000 \n", + "44103 100.666667 \n", + "44834 100.666667 \n", + "227519 Scores - APACHE IV (2) None 100.666667 \n", + "44706 100.666667 \n", + "42892 100.666667 \n", + "45415 100.666667 \n", + "43987 100.666667 \n", + "42666 96.666667 \n", + "44237 96.666667 \n", + "42592 95.333333 \n", + "40069 95.333333 \n", + "43931 93.333333 \n", + "43348 93.333333 \n", + "40405 93.333333 \n", + "42810 93.333333 \n", + "46180 93.333333 \n", + "40055 93.333333 \n", + "44253 93.333333 \n", + "44325 93.333333 \n", + "41857 93.333333 \n", + "44824 93.333333 \n", + "45991 93.333333 \n", + "42042 93.333333 \n", + "46177 93.333333 \n", + "44684 93.333333 \n", + "46658 93.333333 \n", + "46578 93.333333 \n", + "42765 91.333333 \n", + "3819 Urine 90.666667 \n", + "43462 90.666667 \n", + "3816 Urine 90.666667 \n", + "3817 Urine 90.666667 \n", + "3818 Urine 90.666667 \n", + "3822 Urine 90.666667 \n", + "6298 90.666667 " + ] + }, + "execution_count": 87, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.head(40)" + ] + }, + { + "cell_type": "code", + "execution_count": 91, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "out_df.drop(227519,axis=0,inplace=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 96, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.OUTPUT_URINE] = out_df.loc[:46578].index.unique().tolist()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "https://github.com/MIT-LCP/mimic-code/blob/travis/concepts/cookbook/uo.sql" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.OUTPUT_URINE] = keep_dict[data_dict.labels.OUTPUT_URINE]\n", + "to_add = [43175,40094,40715,40473,40085,40057,40056,40428,40086,40096,40651]\n", + "to_add += [227510,226561,226584,226563,226564,226565,226567,226557,226558 ]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Glasgow Coma Scale (GCS)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Eye Opening" + ] + }, + { + "cell_type": "code", + "execution_count": 99, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>184</th>\n", + " <td>Eye Opening</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220739</th>\n", + " <td>GCS - Eye Opening</td>\n", + " <td>Eye Opening</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>198</th>\n", + " <td>GCS Total</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>70033</th>\n", + " <td>EYE</td>\n", + " <td></td>\n", + " <td>microbiologyevents</td>\n", + " <td>SPECIMEN</td>\n", + " <td></td>\n", + " <td>72.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3742</th>\n", + " <td>Basos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3791</th>\n", + " <td>Polys</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3779</th>\n", + " <td>Monos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2834</th>\n", + " <td>ICS</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227011</th>\n", + " <td>GCSEye_ApacheIV</td>\n", + " <td>GCSEye_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>65.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226755</th>\n", + " <td>GcsApacheIIScore</td>\n", + " <td>GcsApacheIIScore</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>None</td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41556</th>\n", + " <td>ng</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>64.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227012</th>\n", + " <td>GCSMotor_ApacheIV</td>\n", + " <td>GCSMotor_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227013</th>\n", + " <td>GcsScore_ApacheIV</td>\n", + " <td>GcsScore_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>None</td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5700</th>\n", + " <td>Gent eye oint</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>63.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227014</th>\n", + " <td>GCSVerbal_ApacheIV</td>\n", + " <td>GCSVerbal_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>62.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50931</th>\n", + " <td>GLUCOSE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>62.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1529</th>\n", + " <td>Glucose</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Chemistry</td>\n", + " <td></td>\n", + " <td>62.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50809</th>\n", + " <td>GLUCOSE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>62.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51478</th>\n", + " <td>GLUCOSE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>62.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223901</th>\n", + " <td>GCS - Motor Response</td>\n", + " <td>Motor Response</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>61.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "184 Eye Opening chartevents \n", + "220739 GCS - Eye Opening Eye Opening \n", + "198 GCS Total chartevents \n", + "70033 EYE microbiologyevents \n", + "3742 Basos chartevents \n", + "3791 Polys chartevents \n", + "3779 Monos chartevents \n", + "2834 ICS chartevents \n", + "227011 GCSEye_ApacheIV GCSEye_ApacheIV \n", + "226755 GcsApacheIIScore GcsApacheIIScore chartevents \n", + "41556 ng inputevents_cv \n", + "227012 GCSMotor_ApacheIV GCSMotor_ApacheIV \n", + "227013 GcsScore_ApacheIV GcsScore_ApacheIV chartevents \n", + "5700 Gent eye oint chartevents \n", + "227014 GCSVerbal_ApacheIV GCSVerbal_ApacheIV \n", + "50931 GLUCOSE NaN labevents \n", + "1529 Glucose chartevents \n", + "50809 GLUCOSE NaN labevents \n", + "51478 GLUCOSE NaN labevents \n", + "223901 GCS - Motor Response Motor Response \n", + "\n", + " category unitname score \n", + "itemid \n", + "184 110.000000 \n", + "220739 Neurological 110.000000 \n", + "198 76.666667 \n", + "70033 SPECIMEN 72.000000 \n", + "3742 CSF 71.333333 \n", + "3791 CSF 71.333333 \n", + "3779 CSF 71.333333 \n", + "2834 67.000000 \n", + "227011 Scores - APACHE IV (2) 65.333333 \n", + "226755 Scores - APACHE II None 64.666667 \n", + "41556 64.000000 \n", + "227012 Scores - APACHE IV (2) 63.333333 \n", + "227013 Scores - APACHE IV (2) None 63.333333 \n", + "5700 63.000000 \n", + "227014 Scores - APACHE IV (2) 62.666667 \n", + "50931 CHEMISTRY NaN 62.333333 \n", + "1529 Chemistry 62.333333 \n", + "50809 BLOOD GAS NaN 62.333333 \n", + "51478 HEMATOLOGY NaN 62.333333 \n", + "223901 Neurological 61.666667 " + ] + }, + "execution_count": 99, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'glasgow come scale',\n", + " 'GCS',\n", + " 'eye opening'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 100, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING] = [184,220739]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Motor" + ] + }, + { + "cell_type": "code", + "execution_count": 101, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>228405</th>\n", + " <td>Motor L Leg</td>\n", + " <td>Motor L Leg</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>85.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228404</th>\n", + " <td>Motor L Arm</td>\n", + " <td>Motor L Arm</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>85.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228407</th>\n", + " <td>Motor R Leg</td>\n", + " <td>Motor R Leg</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>85.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228406</th>\n", + " <td>Motor R Arm</td>\n", + " <td>Motor R Arm</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>85.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227120</th>\n", + " <td>Motor Deficit</td>\n", + " <td>Motor Deficit</td>\n", + " <td></td>\n", + " <td>Pain/Sedation</td>\n", + " <td></td>\n", + " <td>80.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>453</th>\n", + " <td>Motor Deficits</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>454</th>\n", + " <td>Motor Response</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>223901</th>\n", + " <td>GCS - Motor Response</td>\n", + " <td>Motor Response</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>198</th>\n", + " <td>GCS Total</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227012</th>\n", + " <td>GCSMotor_ApacheIV</td>\n", + " <td>GCSMotor_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>73.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3779</th>\n", + " <td>Monos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3742</th>\n", + " <td>Basos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3791</th>\n", + " <td>Polys</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226757</th>\n", + " <td>GCSMotorApacheIIValue</td>\n", + " <td>GCSMotorApacheIIValue</td>\n", + " <td></td>\n", + " <td>Scores - APACHE II</td>\n", + " <td></td>\n", + " <td>68.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2834</th>\n", + " <td>ICS</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225472</th>\n", + " <td>Pneumothorax</td>\n", + " <td>Pneumothorax</td>\n", + " <td>procedureevents_mv</td>\n", + " <td>3-Significant Events</td>\n", + " <td>None</td>\n", + " <td>66.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227011</th>\n", + " <td>GCSEye_ApacheIV</td>\n", + " <td>GCSEye_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>65.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226755</th>\n", + " <td>GcsApacheIIScore</td>\n", + " <td>GcsApacheIIScore</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE II</td>\n", + " <td>None</td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220739</th>\n", + " <td>GCS - Eye Opening</td>\n", + " <td>Eye Opening</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>64.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227013</th>\n", + " <td>GcsScore_ApacheIV</td>\n", + " <td>GcsScore_ApacheIV</td>\n", + " <td>chartevents</td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td>None</td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "228405 Motor L Leg Motor L Leg \n", + "228404 Motor L Arm Motor L Arm \n", + "228407 Motor R Leg Motor R Leg \n", + "228406 Motor R Arm Motor R Arm \n", + "227120 Motor Deficit Motor Deficit \n", + "453 Motor Deficits chartevents \n", + "454 Motor Response chartevents \n", + "223901 GCS - Motor Response Motor Response \n", + "198 GCS Total chartevents \n", + "227012 GCSMotor_ApacheIV GCSMotor_ApacheIV \n", + "3779 Monos chartevents \n", + "3742 Basos chartevents \n", + "3791 Polys chartevents \n", + "226757 GCSMotorApacheIIValue GCSMotorApacheIIValue \n", + "2834 ICS chartevents \n", + "225472 Pneumothorax Pneumothorax procedureevents_mv \n", + "227011 GCSEye_ApacheIV GCSEye_ApacheIV \n", + "226755 GcsApacheIIScore GcsApacheIIScore chartevents \n", + "220739 GCS - Eye Opening Eye Opening \n", + "227013 GcsScore_ApacheIV GcsScore_ApacheIV chartevents \n", + "\n", + " category unitname score \n", + "itemid \n", + "228405 Neurological 85.333333 \n", + "228404 Neurological 85.333333 \n", + "228407 Neurological 85.333333 \n", + "228406 Neurological 85.333333 \n", + "227120 Pain/Sedation 80.666667 \n", + "453 78.666667 \n", + "454 78.666667 \n", + "223901 Neurological 78.666667 \n", + "198 76.666667 \n", + "227012 Scores - APACHE IV (2) 73.333333 \n", + "3779 CSF 71.333333 \n", + "3742 CSF 71.333333 \n", + "3791 CSF 71.333333 \n", + "226757 Scores - APACHE II 68.666667 \n", + "2834 67.000000 \n", + "225472 3-Significant Events None 66.000000 \n", + "227011 Scores - APACHE IV (2) 65.333333 \n", + "226755 Scores - APACHE II None 64.666667 \n", + "220739 Neurological 64.333333 \n", + "227013 Scores - APACHE IV (2) None 63.333333 " + ] + }, + "execution_count": 101, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'glasgow come scale',\n", + " 'GCS',\n", + " 'motor',\n", + " 'motor response'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 102, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_MOTOR] = [454,223901]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Verbal" + ] + }, + { + "cell_type": "code", + "execution_count": 103, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>223900</th>\n", + " <td>GCS - Verbal Response</td>\n", + " <td>Verbal Response</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>723</th>\n", + " <td>Verbal Response</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224756</th>\n", + " <td>Response</td>\n", + " <td>Response</td>\n", + " <td></td>\n", + " <td>Neurological</td>\n", + " <td></td>\n", + " <td>90.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41610</th>\n", + " <td>ER</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227014</th>\n", + " <td>GCSVerbal_ApacheIV</td>\n", + " <td>GCSVerbal_ApacheIV</td>\n", + " <td></td>\n", + " <td>Scores - APACHE IV (2)</td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44473</th>\n", + " <td>er</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>198</th>\n", + " <td>GCS Total</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226758</th>\n", + " <td>GCSVerbalApacheIIValue</td>\n", + " <td>GCSVerbalApacheIIValue</td>\n", + " <td></td>\n", + " <td>Scores - APACHE II</td>\n", + " <td></td>\n", + " <td>72.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3779</th>\n", + " <td>Monos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3742</th>\n", + " <td>Basos</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3791</th>\n", + " <td>Polys</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>CSF</td>\n", + " <td></td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224413</th>\n", + " <td>TOF Response</td>\n", + " <td>TOF Response</td>\n", + " <td></td>\n", + " <td>Pain/Sedation</td>\n", + " <td></td>\n", + " <td>69.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>40450</th>\n", + " <td>EBL</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41693</th>\n", + " <td>Verapamil</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1968</th>\n", + " <td>Verapamil</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42047</th>\n", + " <td>ebl</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>222318</th>\n", + " <td>Verapamil</td>\n", + " <td>Verapamil</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46484</th>\n", + " <td>verapamil</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2834</th>\n", + " <td>ICS</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>224409</th>\n", + " <td>Pain Level Response</td>\n", + " <td>Pain Level Response</td>\n", + " <td></td>\n", + " <td>Pain/Sedation</td>\n", + " <td></td>\n", + " <td>66.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "223900 GCS - Verbal Response Verbal Response \n", + "723 Verbal Response chartevents \n", + "224756 Response Response \n", + "41610 ER inputevents_cv \n", + "227014 GCSVerbal_ApacheIV GCSVerbal_ApacheIV \n", + "44473 er inputevents_cv \n", + "198 GCS Total chartevents \n", + "226758 GCSVerbalApacheIIValue GCSVerbalApacheIIValue \n", + "3779 Monos chartevents \n", + "3742 Basos chartevents \n", + "3791 Polys chartevents \n", + "224413 TOF Response TOF Response \n", + "40450 EBL inputevents_cv \n", + "41693 Verapamil inputevents_cv \n", + "1968 Verapamil chartevents \n", + "42047 ebl inputevents_cv \n", + "222318 Verapamil Verapamil inputevents_mv \n", + "46484 verapamil inputevents_cv \n", + "2834 ICS chartevents \n", + "224409 Pain Level Response Pain Level Response \n", + "\n", + " category unitname score \n", + "itemid \n", + "223900 Neurological 110.000000 \n", + "723 110.000000 \n", + "224756 Neurological 90.000000 \n", + "41610 Free Form Intake 76.666667 \n", + "227014 Scores - APACHE IV (2) 76.666667 \n", + "44473 Free Form Intake 76.666667 \n", + "198 76.666667 \n", + "226758 Scores - APACHE II 72.000000 \n", + "3779 CSF 71.333333 \n", + "3742 CSF 71.333333 \n", + "3791 CSF 71.333333 \n", + "224413 Pain/Sedation 69.666667 \n", + "40450 67.000000 \n", + "41693 Free Form Intake 67.000000 \n", + "1968 67.000000 \n", + "42047 67.000000 \n", + "222318 Medications mg 67.000000 \n", + "46484 Free Form Intake 67.000000 \n", + "2834 67.000000 \n", + "224409 Pain/Sedation 66.000000 " + ] + }, + "execution_count": 103, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'glasgow come scale',\n", + " 'GCS',\n", + " 'verbal',\n", + " 'verbal response'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 104, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_VERBAL] = [723,223900]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Labs\n", + "\n", + "### Lactate" + ] + }, + { + "cell_type": "code", + "execution_count": 105, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>1531</th>\n", + " <td>Lactic Acid</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Chemistry</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225668</th>\n", + " <td>Lactic Acid</td>\n", + " <td>Lactic Acid</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>None</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50813</th>\n", + " <td>LACTATE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220228</th>\n", + " <td>Hemoglobin</td>\n", + " <td>Hemoglobin</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>g/dl</td>\n", + " <td>102.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2773</th>\n", + " <td>sjlactate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>102.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225835</th>\n", + " <td>Na Phos</td>\n", + " <td>Na Phos</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mmol</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225834</th>\n", + " <td>K Phos</td>\n", + " <td>K Phos</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mmol</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227526</th>\n", + " <td>Citrate</td>\n", + " <td>Citrate</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mmol</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225925</th>\n", + " <td>Potassium Phosphate</td>\n", + " <td>Potassium Phosphate</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Nutrition - Supplements</td>\n", + " <td>mmol</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>818</th>\n", + " <td>Lactic Acid(0.5-2.0)</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Chemistry</td>\n", + " <td></td>\n", + " <td>91.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220955</th>\n", + " <td>Ringers Lactate</td>\n", + " <td>Ringers Lactate</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>86.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2638</th>\n", + " <td>CEREBRAL LACTATE</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1634</th>\n", + " <td>lactated ringers</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30021</th>\n", + " <td>Lactated Ringers</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1520</th>\n", + " <td>ACT</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Coags</td>\n", + " <td></td>\n", + " <td>83.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220507</th>\n", + " <td>Activated Clotting Time</td>\n", + " <td>ACT</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>None</td>\n", + " <td>83.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1671</th>\n", + " <td>act</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>83.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221319</th>\n", + " <td>Alteplase (TPA)</td>\n", + " <td>Alteplase (TPA)</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221347</th>\n", + " <td>Amiodarone</td>\n", + " <td>Amiodarone</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221342</th>\n", + " <td>Aminophylline</td>\n", + " <td>Aminophylline</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "1531 Lactic Acid chartevents \n", + "225668 Lactic Acid Lactic Acid chartevents \n", + "50813 LACTATE NaN labevents \n", + "220228 Hemoglobin Hemoglobin chartevents \n", + "2773 sjlactate chartevents \n", + "225835 Na Phos Na Phos inputevents_mv \n", + "225834 K Phos K Phos inputevents_mv \n", + "227526 Citrate Citrate inputevents_mv \n", + "225925 Potassium Phosphate Potassium Phosphate inputevents_mv \n", + "818 Lactic Acid(0.5-2.0) chartevents \n", + "220955 Ringers Lactate Ringers Lactate inputevents_mv \n", + "2638 CEREBRAL LACTATE chartevents \n", + "1634 lactated ringers chartevents \n", + "30021 Lactated Ringers inputevents_cv \n", + "1520 ACT chartevents \n", + "220507 Activated Clotting Time ACT chartevents \n", + "1671 act chartevents \n", + "221319 Alteplase (TPA) Alteplase (TPA) inputevents_mv \n", + "221347 Amiodarone Amiodarone inputevents_mv \n", + "221342 Aminophylline Aminophylline inputevents_mv \n", + "\n", + " category unitname score \n", + "itemid \n", + "1531 Chemistry 110.000000 \n", + "225668 Labs None 110.000000 \n", + "50813 BLOOD GAS NaN 110.000000 \n", + "220228 Labs g/dl 102.666667 \n", + "2773 102.000000 \n", + "225835 Medications mmol 96.666667 \n", + "225834 Medications mmol 96.666667 \n", + "227526 Medications mmol 96.666667 \n", + "225925 Nutrition - Supplements mmol 96.666667 \n", + "818 Chemistry 91.333333 \n", + "220955 Fluids - Other (Not In Use) mL 86.000000 \n", + "2638 84.000000 \n", + "1634 84.000000 \n", + "30021 84.000000 \n", + "1520 Coags 83.333333 \n", + "220507 Labs None 83.333333 \n", + "1671 83.333333 \n", + "221319 Medications mg 81.333333 \n", + "221347 Medications mg 81.333333 \n", + "221342 Medications mg 81.333333 " + ] + }, + "execution_count": 105, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'lactate',\n", + " 'lactic acid',\n", + " 'mmol/L',\n", + " 'mg/dL'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 106, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.LACTATE] = [1531,50813,225668,818]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Hemoglobin" + ] + }, + { + "cell_type": "code", + "execution_count": 107, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>51222</th>\n", + " <td>HEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220228</th>\n", + " <td>Hemoglobin</td>\n", + " <td>Hemoglobin</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>g/dl</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>814</th>\n", + " <td>Hemoglobin</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Hematology</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1165</th>\n", + " <td>Hgb</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50811</th>\n", + " <td>HEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51225</th>\n", + " <td>HEMOGLOBIN F</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>104.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51224</th>\n", + " <td>HEMOGLOBIN C</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>104.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50814</th>\n", + " <td>METHEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51223</th>\n", + " <td>HEMOGLOBIN A2</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7965</th>\n", + " <td>methhemoglobin</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50852</th>\n", + " <td>% HEMOGLOBIN A1C</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51212</th>\n", + " <td>FETAL HEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>94.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50805</th>\n", + " <td>CARBOXYHEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>92.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50855</th>\n", + " <td>ABSOLUTE HEMOGLOBIN</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51226</th>\n", + " <td>HEMOGLOBLIN A</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51227</th>\n", + " <td>HEMOGLOBLIN S</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42232</th>\n", + " <td>THYMOGLOBLIN</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45486</th>\n", + " <td>Hemo</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42117</th>\n", + " <td>THYMOGLOBULIN</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>78.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50934</th>\n", + " <td>H</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>76.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto category \\\n", + "itemid \n", + "51222 HEMOGLOBIN NaN labevents HEMATOLOGY \n", + "220228 Hemoglobin Hemoglobin chartevents Labs \n", + "814 Hemoglobin chartevents Hematology \n", + "1165 Hgb chartevents \n", + "50811 HEMOGLOBIN NaN labevents BLOOD GAS \n", + "51225 HEMOGLOBIN F NaN labevents HEMATOLOGY \n", + "51224 HEMOGLOBIN C NaN labevents HEMATOLOGY \n", + "50814 METHEMOGLOBIN NaN labevents BLOOD GAS \n", + "51223 HEMOGLOBIN A2 NaN labevents HEMATOLOGY \n", + "7965 methhemoglobin chartevents \n", + "50852 % HEMOGLOBIN A1C NaN labevents CHEMISTRY \n", + "51212 FETAL HEMOGLOBIN NaN labevents HEMATOLOGY \n", + "50805 CARBOXYHEMOGLOBIN NaN labevents BLOOD GAS \n", + "50855 ABSOLUTE HEMOGLOBIN NaN labevents CHEMISTRY \n", + "51226 HEMOGLOBLIN A NaN labevents HEMATOLOGY \n", + "51227 HEMOGLOBLIN S NaN labevents HEMATOLOGY \n", + "42232 THYMOGLOBLIN inputevents_cv Free Form Intake \n", + "45486 Hemo inputevents_cv \n", + "42117 THYMOGLOBULIN inputevents_cv Free Form Intake \n", + "50934 H NaN labevents CHEMISTRY \n", + "\n", + " unitname score \n", + "itemid \n", + "51222 NaN 110.000000 \n", + "220228 g/dl 110.000000 \n", + "814 110.000000 \n", + "1165 110.000000 \n", + "50811 NaN 110.000000 \n", + "51225 NaN 104.000000 \n", + "51224 NaN 104.000000 \n", + "50814 NaN 101.333333 \n", + "51223 NaN 101.333333 \n", + "7965 98.666667 \n", + "50852 NaN 96.666667 \n", + "51212 NaN 94.666667 \n", + "50805 NaN 92.666667 \n", + "50855 NaN 89.333333 \n", + "51226 NaN 88.000000 \n", + "51227 NaN 88.000000 \n", + "42232 81.333333 \n", + "45486 81.333333 \n", + "42117 78.666667 \n", + "50934 NaN 76.666667 " + ] + }, + "execution_count": 107, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'hgb',\n", + " 'hemoglobin',\n", + " 'g/dL'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 108, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.HEMOGLOBIN] = [51222,220228,814,1165,50811]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Fluids\n", + "\n", + "### Normal Saline" + ] + }, + { + "cell_type": "code", + "execution_count": 109, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>41913</th>\n", + " <td>NS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6190</th>\n", + " <td>Normal saline</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30143</th>\n", + " <td>3% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>104.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30168</th>\n", + " <td>Normal Saline_GU</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30160</th>\n", + " <td>D5 Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30161</th>\n", + " <td>.3% normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30018</th>\n", + " <td>.9% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30020</th>\n", + " <td>.45% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30176</th>\n", + " <td>.25% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30352</th>\n", + " <td>0.9% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220962</th>\n", + " <td>Saline 3%</td>\n", + " <td>Saline 3%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>98.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30353</th>\n", + " <td>0.45% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44440</th>\n", + " <td>Normal Saline Bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44053</th>\n", + " <td>normal saline bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4647</th>\n", + " <td>normal saline bolus</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43354</th>\n", + " <td>normal saline flushs</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>96.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221213</th>\n", + " <td>Saline 30%</td>\n", + " <td>Saline 30%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>95.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220959</th>\n", + " <td>Saline 0,3%</td>\n", + " <td>Saline 0,3%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>92.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220954</th>\n", + " <td>Saline 0,9%</td>\n", + " <td>Saline 0,9%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>92.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220960</th>\n", + " <td>Saline 0,45%</td>\n", + " <td>Saline 0,45%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "41913 NS inputevents_cv \n", + "6190 Normal saline chartevents \n", + "30143 3% Normal Saline inputevents_cv \n", + "30168 Normal Saline_GU inputevents_cv \n", + "30160 D5 Normal Saline inputevents_cv \n", + "30161 .3% normal Saline inputevents_cv \n", + "30018 .9% Normal Saline inputevents_cv \n", + "30020 .45% Normal Saline inputevents_cv \n", + "30176 .25% Normal Saline inputevents_cv \n", + "30352 0.9% Normal Saline inputevents_cv \n", + "220962 Saline 3% Saline 3% inputevents_mv \n", + "30353 0.45% Normal Saline inputevents_cv \n", + "44440 Normal Saline Bolus inputevents_cv \n", + "44053 normal saline bolus inputevents_cv \n", + "4647 normal saline bolus chartevents \n", + "43354 normal saline flushs inputevents_cv \n", + "221213 Saline 30% Saline 30% inputevents_mv \n", + "220959 Saline 0,3% Saline 0,3% inputevents_mv \n", + "220954 Saline 0,9% Saline 0,9% inputevents_mv \n", + "220960 Saline 0,45% Saline 0,45% inputevents_mv \n", + "\n", + " category unitname score \n", + "itemid \n", + "41913 Free Form Intake 110.000000 \n", + "6190 110.000000 \n", + "30143 104.333333 \n", + "30168 103.333333 \n", + "30160 103.333333 \n", + "30161 103.333333 \n", + "30018 103.333333 \n", + "30020 101.333333 \n", + "30176 101.333333 \n", + "30352 100.333333 \n", + "220962 Fluids - Other (Not In Use) mL 98.666667 \n", + "30353 98.333333 \n", + "44440 Free Form Intake 97.333333 \n", + "44053 Free Form Intake 97.333333 \n", + "4647 97.333333 \n", + "43354 Free Form Intake 96.000000 \n", + "221213 Fluids - Other (Not In Use) mL 95.000000 \n", + "220959 Fluids - Other (Not In Use) mL 92.000000 \n", + "220954 Fluids - Other (Not In Use) mL 92.000000 \n", + "220960 Fluids - Other (Not In Use) mL 89.333333 " + ] + }, + "execution_count": 109, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'saline',\n", + " 'NS',\n", + " '0.9%',\n", + " 'normal saline'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 110, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.NORMAL_SALINE] = [41913,6190,20018,30252,44440,44053,4647,220954]" + ] + }, + { + "cell_type": "code", + "execution_count": 111, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>41913</th>\n", + " <td>NS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6190</th>\n", + " <td>Normal saline</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30143</th>\n", + " <td>3% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>104.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30168</th>\n", + " <td>Normal Saline_GU</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30160</th>\n", + " <td>D5 Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30161</th>\n", + " <td>.3% normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30018</th>\n", + " <td>.9% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>103.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30020</th>\n", + " <td>.45% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30176</th>\n", + " <td>.25% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>101.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30352</th>\n", + " <td>0.9% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>100.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220962</th>\n", + " <td>Saline 3%</td>\n", + " <td>Saline 3%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>98.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30353</th>\n", + " <td>0.45% Normal Saline</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44440</th>\n", + " <td>Normal Saline Bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44053</th>\n", + " <td>normal saline bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4647</th>\n", + " <td>normal saline bolus</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>43354</th>\n", + " <td>normal saline flushs</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>96.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221213</th>\n", + " <td>Saline 30%</td>\n", + " <td>Saline 30%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>95.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220959</th>\n", + " <td>Saline 0,3%</td>\n", + " <td>Saline 0,3%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>92.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220954</th>\n", + " <td>Saline 0,9%</td>\n", + " <td>Saline 0,9%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>92.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220960</th>\n", + " <td>Saline 0,45%</td>\n", + " <td>Saline 0,45%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220961</th>\n", + " <td>Saline 0,65%</td>\n", + " <td>Saline 0,65%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221212</th>\n", + " <td>Saline 0,18%</td>\n", + " <td>Saline 0,18%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>89.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>41392</th>\n", + " <td>ns b</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225825</th>\n", + " <td>D5NS</td>\n", + " <td>D5NS</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5333</th>\n", + " <td>saline flush</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30060</th>\n", + " <td>D5NS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>226401</th>\n", + " <td>GU Irrigant - Normal Saline</td>\n", + " <td>GU Irrigant - Normal Saline</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>87.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220958</th>\n", + " <td>Saline 0,255%</td>\n", + " <td>Saline 0,255%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>86.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2619</th>\n", + " <td>3% NS</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>227344</th>\n", + " <td>IV/Saline lock</td>\n", + " <td>IV/Saline lock</td>\n", + " <td></td>\n", + " <td>Restraint/Support Systems</td>\n", + " <td></td>\n", + " <td>83.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30190</th>\n", + " <td>NS .9%</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>82.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225158</th>\n", + " <td>NaCl 0.9%</td>\n", + " <td>NaCl 0.9%</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>82.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45298</th>\n", + " <td>ED NS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2072</th>\n", + " <td>Pinsp</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2107</th>\n", + " <td>pinsp</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7092</th>\n", + " <td>Tinsp</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6384</th>\n", + " <td>PINSP</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44498</th>\n", + " <td>er ns</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3204</th>\n", + " <td>Pinsp.</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2404</th>\n", + " <td>.45%ns</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>79.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "41913 NS \n", + "6190 Normal saline \n", + "30143 3% Normal Saline \n", + "30168 Normal Saline_GU \n", + "30160 D5 Normal Saline \n", + "30161 .3% normal Saline \n", + "30018 .9% Normal Saline \n", + "30020 .45% Normal Saline \n", + "30176 .25% Normal Saline \n", + "30352 0.9% Normal Saline \n", + "220962 Saline 3% Saline 3% \n", + "30353 0.45% Normal Saline \n", + "44440 Normal Saline Bolus \n", + "44053 normal saline bolus \n", + "4647 normal saline bolus \n", + "43354 normal saline flushs \n", + "221213 Saline 30% Saline 30% \n", + "220959 Saline 0,3% Saline 0,3% \n", + "220954 Saline 0,9% Saline 0,9% \n", + "220960 Saline 0,45% Saline 0,45% \n", + "220961 Saline 0,65% Saline 0,65% \n", + "221212 Saline 0,18% Saline 0,18% \n", + "41392 ns b \n", + "225825 D5NS D5NS \n", + "5333 saline flush \n", + "30060 D5NS \n", + "226401 GU Irrigant - Normal Saline GU Irrigant - Normal Saline \n", + "220958 Saline 0,255% Saline 0,255% \n", + "2619 3% NS \n", + "227344 IV/Saline lock IV/Saline lock \n", + "30190 NS .9% \n", + "225158 NaCl 0.9% NaCl 0.9% \n", + "45298 ED NS \n", + "2072 Pinsp \n", + "2107 pinsp \n", + "7092 Tinsp \n", + "6384 PINSP \n", + "44498 er ns \n", + "3204 Pinsp. \n", + "2404 .45%ns \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "41913 inputevents_cv Free Form Intake 110.000000 \n", + "6190 chartevents 110.000000 \n", + "30143 inputevents_cv 104.333333 \n", + "30168 inputevents_cv 103.333333 \n", + "30160 inputevents_cv 103.333333 \n", + "30161 inputevents_cv 103.333333 \n", + "30018 inputevents_cv 103.333333 \n", + "30020 inputevents_cv 101.333333 \n", + "30176 inputevents_cv 101.333333 \n", + "30352 inputevents_cv 100.333333 \n", + "220962 inputevents_mv Fluids - Other (Not In Use) mL 98.666667 \n", + "30353 inputevents_cv 98.333333 \n", + "44440 inputevents_cv Free Form Intake 97.333333 \n", + "44053 inputevents_cv Free Form Intake 97.333333 \n", + "4647 chartevents 97.333333 \n", + "43354 inputevents_cv Free Form Intake 96.000000 \n", + "221213 inputevents_mv Fluids - Other (Not In Use) mL 95.000000 \n", + "220959 inputevents_mv Fluids - Other (Not In Use) mL 92.000000 \n", + "220954 inputevents_mv Fluids - Other (Not In Use) mL 92.000000 \n", + "220960 inputevents_mv Fluids - Other (Not In Use) mL 89.333333 \n", + "220961 inputevents_mv Fluids - Other (Not In Use) mL 89.333333 \n", + "221212 inputevents_mv Fluids - Other (Not In Use) mL 89.333333 \n", + "41392 inputevents_cv Free Form Intake 88.000000 \n", + "225825 inputevents_mv Fluids/Intake mL 88.000000 \n", + "5333 chartevents 88.000000 \n", + "30060 inputevents_cv 88.000000 \n", + "226401 inputevents_mv Fluids/Intake mL 87.666667 \n", + "220958 inputevents_mv Fluids - Other (Not In Use) mL 86.666667 \n", + "2619 chartevents 84.666667 \n", + "227344 Restraint/Support Systems 83.333333 \n", + "30190 inputevents_cv 82.333333 \n", + "225158 inputevents_mv Fluids/Intake mL 82.333333 \n", + "45298 inputevents_cv Free Form Intake 81.333333 \n", + "2072 chartevents 81.333333 \n", + "2107 chartevents 81.333333 \n", + "7092 chartevents 81.333333 \n", + "6384 chartevents 81.333333 \n", + "44498 inputevents_cv Free Form Intake 81.333333 \n", + "3204 chartevents 79.000000 \n", + "2404 chartevents 79.000000 " + ] + }, + "execution_count": 111, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.head(40)" + ] + }, + { + "cell_type": "code", + "execution_count": 112, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.NORMAL_SALINE] += [30190,225158]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Lactated Ringers" + ] + }, + { + "cell_type": "code", + "execution_count": 113, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>225828</th>\n", + " <td>LR</td>\n", + " <td>LR</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44367</th>\n", + " <td>LR</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2971</th>\n", + " <td>LR</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1634</th>\n", + " <td>lactated ringers</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30021</th>\n", + " <td>Lactated Ringers</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45532</th>\n", + " <td>IR Lactated ringers</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>104.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225943</th>\n", + " <td>Solution</td>\n", + " <td>Solution</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225827</th>\n", + " <td>D5LR</td>\n", + " <td>D5LR</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50813</th>\n", + " <td>LACTATE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220953</th>\n", + " <td>Ringers</td>\n", + " <td>Ringers</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46207</th>\n", + " <td>OR LR</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44184</th>\n", + " <td>LR Bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44521</th>\n", + " <td>LR bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46781</th>\n", + " <td>lr bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44815</th>\n", + " <td>LR BOLUS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44915</th>\n", + " <td>D5LR 40K</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46538</th>\n", + " <td>PD solution in</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>68.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44837</th>\n", + " <td>ED URINE</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8313</th>\n", + " <td>Nystatin solution</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30125</th>\n", + " <td>Milrinone</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "225828 LR LR inputevents_mv \n", + "44367 LR inputevents_cv \n", + "2971 LR chartevents \n", + "1634 lactated ringers chartevents \n", + "30021 Lactated Ringers inputevents_cv \n", + "45532 IR Lactated ringers inputevents_cv \n", + "225943 Solution Solution inputevents_mv \n", + "225827 D5LR D5LR inputevents_mv \n", + "50813 LACTATE NaN labevents \n", + "220953 Ringers Ringers inputevents_mv \n", + "46207 OR LR inputevents_cv \n", + "44184 LR Bolus inputevents_cv \n", + "44521 LR bolus inputevents_cv \n", + "46781 lr bolus inputevents_cv \n", + "44815 LR BOLUS inputevents_cv \n", + "44915 D5LR 40K inputevents_cv \n", + "46538 PD solution in inputevents_cv \n", + "44837 ED URINE outputevents \n", + "8313 Nystatin solution chartevents \n", + "30125 Milrinone inputevents_cv \n", + "\n", + " category unitname score \n", + "itemid \n", + "225828 Fluids/Intake mL 110.000000 \n", + "44367 Free Form Intake 110.000000 \n", + "2971 110.000000 \n", + "1634 110.000000 \n", + "30021 110.000000 \n", + "45532 Free Form Intake 104.000000 \n", + "225943 Fluids/Intake mL 88.000000 \n", + "225827 Fluids/Intake mL 88.000000 \n", + "50813 BLOOD GAS NaN 84.000000 \n", + "220953 Fluids - Other (Not In Use) mL 84.000000 \n", + "46207 Free Form Intake 81.333333 \n", + "44184 Free Form Intake 70.000000 \n", + "44521 Free Form Intake 70.000000 \n", + "46781 Free Form Intake 70.000000 \n", + "44815 Free Form Intake 70.000000 \n", + "44915 Free Form Intake 70.000000 \n", + "46538 Free Form Intake 68.333333 \n", + "44837 68.000000 \n", + "8313 67.666667 \n", + "30125 67.333333 " + ] + }, + "execution_count": 113, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'LR',\n", + " 'ringers solution',\n", + " 'lactated ringers'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 114, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>225828</th>\n", + " <td>LR</td>\n", + " <td>LR</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44367</th>\n", + " <td>LR</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2971</th>\n", + " <td>LR</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1634</th>\n", + " <td>lactated ringers</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30021</th>\n", + " <td>Lactated Ringers</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45532</th>\n", + " <td>IR Lactated ringers</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>104.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225943</th>\n", + " <td>Solution</td>\n", + " <td>Solution</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225827</th>\n", + " <td>D5LR</td>\n", + " <td>D5LR</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids/Intake</td>\n", + " <td>mL</td>\n", + " <td>88.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50813</th>\n", + " <td>LACTATE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220953</th>\n", + " <td>Ringers</td>\n", + " <td>Ringers</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>84.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46207</th>\n", + " <td>OR LR</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>81.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44184</th>\n", + " <td>LR Bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44521</th>\n", + " <td>LR bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46781</th>\n", + " <td>lr bolus</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44815</th>\n", + " <td>LR BOLUS</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44915</th>\n", + " <td>D5LR 40K</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46538</th>\n", + " <td>PD solution in</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>68.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44837</th>\n", + " <td>ED URINE</td>\n", + " <td></td>\n", + " <td>outputevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8313</th>\n", + " <td>Nystatin solution</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30125</th>\n", + " <td>Milrinone</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221986</th>\n", + " <td>Milrinone</td>\n", + " <td>Milrinone</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>67.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30159</th>\n", + " <td>D5 Ringers Lact.</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>67.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228159</th>\n", + " <td>Purge Solution Flow Rate</td>\n", + " <td>Purge Solution Flow Rate</td>\n", + " <td>chartevents</td>\n", + " <td>Impella</td>\n", + " <td>ml/hr</td>\n", + " <td>66.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225953</th>\n", + " <td>Solution (Peritoneal Dialysis)</td>\n", + " <td>Solution (PD)</td>\n", + " <td></td>\n", + " <td>Dialysis</td>\n", + " <td></td>\n", + " <td>66.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45983</th>\n", + " <td>Pitocin/LR</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>65.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42409</th>\n", + " <td>D5LR W/40K</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>65.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42978</th>\n", + " <td>D5LR 20KCL</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>65.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1189</th>\n", + " <td>finger stick</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>65.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5743</th>\n", + " <td>NT suction</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1520</th>\n", + " <td>ACT</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td>Coags</td>\n", + " <td></td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220507</th>\n", + " <td>Activated Clotting Time</td>\n", + " <td>ACT</td>\n", + " <td>chartevents</td>\n", + " <td>Labs</td>\n", + " <td>None</td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1671</th>\n", + " <td>act</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>64.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8339</th>\n", + " <td>Neo Opium Solution</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>64.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42288</th>\n", + " <td>LR w/40 kcl</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>64.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225072</th>\n", + " <td>Living situation</td>\n", + " <td>Living situation</td>\n", + " <td></td>\n", + " <td>Adm History/FHPA</td>\n", + " <td></td>\n", + " <td>63.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42345</th>\n", + " <td>LR w/ 40 mEq</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2773</th>\n", + " <td>sjlactate</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5088</th>\n", + " <td>fingers</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42265</th>\n", + " <td>LR W/ 20 KCL</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>63.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>220955</th>\n", + " <td>Ringers Lactate</td>\n", + " <td>Ringers Lactate</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Fluids - Other (Not In Use)</td>\n", + " <td>mL</td>\n", + " <td>63.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation \\\n", + "itemid \n", + "225828 LR LR \n", + "44367 LR \n", + "2971 LR \n", + "1634 lactated ringers \n", + "30021 Lactated Ringers \n", + "45532 IR Lactated ringers \n", + "225943 Solution Solution \n", + "225827 D5LR D5LR \n", + "50813 LACTATE NaN \n", + "220953 Ringers Ringers \n", + "46207 OR LR \n", + "44184 LR Bolus \n", + "44521 LR bolus \n", + "46781 lr bolus \n", + "44815 LR BOLUS \n", + "44915 D5LR 40K \n", + "46538 PD solution in \n", + "44837 ED URINE \n", + "8313 Nystatin solution \n", + "30125 Milrinone \n", + "221986 Milrinone Milrinone \n", + "30159 D5 Ringers Lact. \n", + "228159 Purge Solution Flow Rate Purge Solution Flow Rate \n", + "225953 Solution (Peritoneal Dialysis) Solution (PD) \n", + "45983 Pitocin/LR \n", + "42409 D5LR W/40K \n", + "42978 D5LR 20KCL \n", + "1189 finger stick \n", + "5743 NT suction \n", + "1520 ACT \n", + "220507 Activated Clotting Time ACT \n", + "1671 act \n", + "8339 Neo Opium Solution \n", + "42288 LR w/40 kcl \n", + "225072 Living situation Living situation \n", + "42345 LR w/ 40 mEq \n", + "2773 sjlactate \n", + "5088 fingers \n", + "42265 LR W/ 20 KCL \n", + "220955 Ringers Lactate Ringers Lactate \n", + "\n", + " linksto category unitname score \n", + "itemid \n", + "225828 inputevents_mv Fluids/Intake mL 110.000000 \n", + "44367 inputevents_cv Free Form Intake 110.000000 \n", + "2971 chartevents 110.000000 \n", + "1634 chartevents 110.000000 \n", + "30021 inputevents_cv 110.000000 \n", + "45532 inputevents_cv Free Form Intake 104.000000 \n", + "225943 inputevents_mv Fluids/Intake mL 88.000000 \n", + "225827 inputevents_mv Fluids/Intake mL 88.000000 \n", + "50813 labevents BLOOD GAS NaN 84.000000 \n", + "220953 inputevents_mv Fluids - Other (Not In Use) mL 84.000000 \n", + "46207 inputevents_cv Free Form Intake 81.333333 \n", + "44184 inputevents_cv Free Form Intake 70.000000 \n", + "44521 inputevents_cv Free Form Intake 70.000000 \n", + "46781 inputevents_cv Free Form Intake 70.000000 \n", + "44815 inputevents_cv Free Form Intake 70.000000 \n", + "44915 inputevents_cv Free Form Intake 70.000000 \n", + "46538 inputevents_cv Free Form Intake 68.333333 \n", + "44837 outputevents 68.000000 \n", + "8313 chartevents 67.666667 \n", + "30125 inputevents_cv 67.333333 \n", + "221986 inputevents_mv Medications mg 67.333333 \n", + "30159 inputevents_cv 67.333333 \n", + "228159 chartevents Impella ml/hr 66.666667 \n", + "225953 Dialysis 66.000000 \n", + "45983 inputevents_cv Free Form Intake 65.333333 \n", + "42409 inputevents_cv Free Form Intake 65.333333 \n", + "42978 inputevents_cv Free Form Intake 65.333333 \n", + "1189 chartevents 65.000000 \n", + "5743 chartevents 64.666667 \n", + "1520 chartevents Coags 64.666667 \n", + "220507 chartevents Labs None 64.666667 \n", + "1671 chartevents 64.666667 \n", + "8339 chartevents 64.333333 \n", + "42288 inputevents_cv Free Form Intake 64.000000 \n", + "225072 Adm History/FHPA 63.666667 \n", + "42345 inputevents_cv Free Form Intake 63.333333 \n", + "2773 chartevents 63.333333 \n", + "5088 chartevents 63.333333 \n", + "42265 inputevents_cv Free Form Intake 63.333333 \n", + "220955 inputevents_mv Fluids - Other (Not In Use) mL 63.000000 " + ] + }, + "execution_count": 114, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df.head(40)" + ] + }, + { + "cell_type": "code", + "execution_count": 115, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.LACTATED_RINGERS] = [225828,44367,2971,1634,30021,220953,46207,44184,44521,46781,44815]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Pressors" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Norepinephrine" + ] + }, + { + "cell_type": "code", + "execution_count": 117, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>30047</th>\n", + " <td>Levophed</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221906</th>\n", + " <td>Norepinephrine</td>\n", + " <td>Norepinephrine</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30120</th>\n", + " <td>Levophed-k</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>102.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30044</th>\n", + " <td>Epinephrine</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>102.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>221289</th>\n", + " <td>Epinephrine</td>\n", + " <td>Epinephrine</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>mg</td>\n", + " <td>102.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5752</th>\n", + " <td>Epinephrin</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>98.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51201</th>\n", + " <td>EPINEPHERINE</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>88.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30119</th>\n", + " <td>Epinephrine-k</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>84.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30309</th>\n", + " <td>Epinephrine Drip</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>77.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30127</th>\n", + " <td>Neosynephrine</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>72.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>225922</th>\n", + " <td>Nephramine</td>\n", + " <td>Nephramine</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Nutrition - Supplements</td>\n", + " <td>mL</td>\n", + " <td>71.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3112</th>\n", + " <td>epinephrine mcg/min</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>71.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50820</th>\n", + " <td>PH</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51491</th>\n", + " <td>PH</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>HEMATOLOGY</td>\n", + " <td>NaN</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>51094</th>\n", + " <td>PH</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>CHEMISTRY</td>\n", + " <td>NaN</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50831</th>\n", + " <td>PH</td>\n", + " <td>NaN</td>\n", + " <td>labevents</td>\n", + " <td>BLOOD GAS</td>\n", + " <td>NaN</td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45183</th>\n", + " <td>ED</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7459</th>\n", + " <td>Ph</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1673</th>\n", + " <td>PH</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>70.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>30128</th>\n", + " <td>Neosynephrine-k</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>69.666667</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "30047 Levophed inputevents_cv \n", + "221906 Norepinephrine Norepinephrine inputevents_mv \n", + "30120 Levophed-k inputevents_cv \n", + "30044 Epinephrine inputevents_cv \n", + "221289 Epinephrine Epinephrine inputevents_mv \n", + "5752 Epinephrin chartevents \n", + "51201 EPINEPHERINE NaN labevents \n", + "30119 Epinephrine-k inputevents_cv \n", + "30309 Epinephrine Drip inputevents_cv \n", + "30127 Neosynephrine inputevents_cv \n", + "225922 Nephramine Nephramine inputevents_mv \n", + "3112 epinephrine mcg/min chartevents \n", + "50820 PH NaN labevents \n", + "51491 PH NaN labevents \n", + "51094 PH NaN labevents \n", + "50831 PH NaN labevents \n", + "45183 ED inputevents_cv \n", + "7459 Ph chartevents \n", + "1673 PH chartevents \n", + "30128 Neosynephrine-k inputevents_cv \n", + "\n", + " category unitname score \n", + "itemid \n", + "30047 110.000000 \n", + "221906 Medications mg 110.000000 \n", + "30120 102.666667 \n", + "30044 102.000000 \n", + "221289 Medications mg 102.000000 \n", + "5752 98.666667 \n", + "51201 HEMATOLOGY NaN 88.666667 \n", + "30119 84.666667 \n", + "30309 77.333333 \n", + "30127 72.333333 \n", + "225922 Nutrition - Supplements mL 71.333333 \n", + "3112 71.000000 \n", + "50820 BLOOD GAS NaN 70.000000 \n", + "51491 HEMATOLOGY NaN 70.000000 \n", + "51094 CHEMISTRY NaN 70.000000 \n", + "50831 BLOOD GAS NaN 70.000000 \n", + "45183 Free Form Intake 70.000000 \n", + "7459 70.000000 \n", + "1673 70.000000 \n", + "30128 69.666667 " + ] + }, + "execution_count": 117, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'levophed',\n", + " 'norepinephrine'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 118, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.NOREPINEPHRINE] = [30047,221906,30120]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Vasopressin" + ] + }, + { + "cell_type": "code", + "execution_count": 119, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>abbreviation</th>\n", + " <th>linksto</th>\n", + " <th>category</th>\n", + " <th>unitname</th>\n", + " <th>score</th>\n", + " </tr>\n", + " <tr>\n", + " <th>itemid</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>30051</th>\n", + " <td>Vasopressin</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2445</th>\n", + " <td>Vasopressin</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>222315</th>\n", + " <td>Vasopressin</td>\n", + " <td>Vasopressin</td>\n", + " <td>inputevents_mv</td>\n", + " <td>Medications</td>\n", + " <td>units</td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1136</th>\n", + " <td>vasopressin</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1222</th>\n", + " <td>VASOPRESSIN</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>110.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2334</th>\n", + " <td>vasopressin u/hr</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2561</th>\n", + " <td>VASOPRESSIN U/HR</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>97.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7341</th>\n", + " <td>Vasopressin u/hr</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>96.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46570</th>\n", + " <td>vassopressin</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>94.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42802</th>\n", + " <td>VASOPRESSIN CC/HR.</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>94.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6255</th>\n", + " <td>VAsopressin 0.04 s</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>92.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2765</th>\n", + " <td>VASOPRESSIN UNIT/R</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>92.333333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2248</th>\n", + " <td>VASOPRESSIN UNIT/MIN</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>42273</th>\n", + " <td>vasopressin unit/min</td>\n", + " <td></td>\n", + " <td>inputevents_cv</td>\n", + " <td>Free Form Intake</td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1327</th>\n", + " <td>vasopressin unit/min</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>90.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6269</th>\n", + " <td>Dressing</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>46</th>\n", + " <td>Angio Dressing #2</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6691</th>\n", + " <td>DRIV PRESS</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>45</th>\n", + " <td>Angio Dressing #1</td>\n", + " <td></td>\n", + " <td>chartevents</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>68.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>228448</th>\n", + " <td>Angio Dressing # 4</td>\n", + " <td>Angio Dressing # 4</td>\n", + " <td></td>\n", + " <td>Cardiovascular</td>\n", + " <td></td>\n", + " <td>67.333333</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label abbreviation linksto \\\n", + "itemid \n", + "30051 Vasopressin inputevents_cv \n", + "2445 Vasopressin chartevents \n", + "222315 Vasopressin Vasopressin inputevents_mv \n", + "1136 vasopressin chartevents \n", + "1222 VASOPRESSIN chartevents \n", + "2334 vasopressin u/hr chartevents \n", + "2561 VASOPRESSIN U/HR chartevents \n", + "7341 Vasopressin u/hr chartevents \n", + "46570 vassopressin inputevents_cv \n", + "42802 VASOPRESSIN CC/HR. inputevents_cv \n", + "6255 VAsopressin 0.04 s chartevents \n", + "2765 VASOPRESSIN UNIT/R chartevents \n", + "2248 VASOPRESSIN UNIT/MIN chartevents \n", + "42273 vasopressin unit/min inputevents_cv \n", + "1327 vasopressin unit/min chartevents \n", + "6269 Dressing chartevents \n", + "46 Angio Dressing #2 chartevents \n", + "6691 DRIV PRESS chartevents \n", + "45 Angio Dressing #1 chartevents \n", + "228448 Angio Dressing # 4 Angio Dressing # 4 \n", + "\n", + " category unitname score \n", + "itemid \n", + "30051 110.000000 \n", + "2445 110.000000 \n", + "222315 Medications units 110.000000 \n", + "1136 110.000000 \n", + "1222 110.000000 \n", + "2334 97.333333 \n", + "2561 97.333333 \n", + "7341 96.666667 \n", + "46570 Free Form Intake 94.333333 \n", + "42802 Free Form Intake 94.000000 \n", + "6255 92.333333 \n", + "2765 92.333333 \n", + "2248 90.666667 \n", + "42273 Free Form Intake 90.666667 \n", + "1327 90.666667 \n", + "6269 68.666667 \n", + "46 68.000000 \n", + "6691 68.000000 \n", + "45 68.000000 \n", + "228448 Cardiovascular 67.333333 " + ] + }, + "execution_count": 119, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df = explorer.search([\n", + " 'vasopressin',\n", + " 'argipressin',\n", + " 'arginine vasopressin'\n", + " ])\n", + "out_df.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 120, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "keep_dict[data_dict.labels.VASOPRESSIN] = out_df.loc[:1327].index.tolist()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Now build our mapping dataframe" + ] + }, + { + "cell_type": "code", + "execution_count": 124, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import pandas as pd\n", + "from itertools import product" + ] + }, + { + "cell_type": "code", + "execution_count": 131, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "tuples = []\n", + "\n", + "for label,items in keep_dict.iteritems():\n", + " tuples += list(product([label],items))\n", + "\n", + "item_map = pd.DataFrame(tuples,columns=['label','itemid'])" + ] + }, + { + "cell_type": "code", + "execution_count": 132, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>glasgow coma scale eye opening</td>\n", + " <td>184</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>glasgow coma scale eye opening</td>\n", + " <td>220739</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>glasgow coma scale motor</td>\n", + " <td>454</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>glasgow coma scale motor</td>\n", + " <td>223901</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>blood pressure systolic</td>\n", + " <td>220179</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " label itemid\n", + "0 glasgow coma scale eye opening 184\n", + "1 glasgow coma scale eye opening 220739\n", + "2 glasgow coma scale motor 454\n", + "3 glasgow coma scale motor 223901\n", + "4 blood pressure systolic 220179" + ] + }, + "execution_count": 132, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "item_map.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 133, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "item_map.to_csv('config/mimic_item_map.csv',index=False)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Extract MIMIC III data" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import mimic\n", + "from constants import ALL\n", + "import icu_data_defs \n", + "import utils\n", + "import logger\n", + "import warnings\n", + "warnings.filterwarnings('ignore')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(icu_data_defs)\n", + "reload(mimic)\n", + "reload(logger)\n", + "\n", + "def extract_labels(conn,labels,item_map_fname,hdf5_fname,hadm_ids=ALL):\n", + " logger.log('Start extracting {} labels'.format(len(labels)),new_level=True)\n", + " extractor = mimic.mimic_extractor(conn,item_map_fname)\n", + " for label in labels:\n", + " logger.log(label.upper(),new_level=True)\n", + " df = extractor.extract_label(label,hadm_ids)\n", + " if df is None: continue\n", + " utils.save_df(df,hdf5_fname,'extract/{}'.format(label))\n", + " display(df.head())\n", + " print df.shape\n", + " del df\n", + " logger.end_log()\n", + " return \n", + "\n", + "#connect to the mimic database\n", + "conn = mimic.connect()\n", + "\n", + "#these are the default config files we will be using\n", + "item_map_fname = 'config/mimic_item_map.csv'\n", + "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n", + "\n", + "#get all labels\n", + "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n", + "simple_data = data_dict.get_panel_defintions(12) #12 is \"simple data\"\n", + "labels = simple_data.label.unique().tolist()\n", + "\n", + "#where we will be storing this extraction\n", + "hdf5_fname = 'data/mimic_data'" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 03:26:58) Start extracting 5 labels\n", + "(2017-06-03 03:26:58)>> HEART RATE\n", + "(2017-06-03 03:26:59)>>>> Extracting 5 items from chartevents\n", + "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n", + "(2017-06-03 03:26:59)>>>> Combine DF\n", + "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n", + "(2017-06-03 03:26:59)>>>> Clean UOM\n", + "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:00:00</td>\n", + " <td>62</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:30:00</td>\n", + " <td>67</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 01:00:00</td>\n", + " <td>67</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 01:20:00</td>\n", + " <td>63</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 01:25:00</td>\n", + " <td>63</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 143838 2129-07-14 00:00:00 62 beat/min 211\n", + "1 143838 2129-07-14 00:30:00 67 beat/min 211\n", + "2 143838 2129-07-14 01:00:00 67 beat/min 211\n", + "3 143838 2129-07-14 01:20:00 63 beat/min 211\n", + "4 143838 2129-07-14 01:25:00 63 beat/min 211" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(1649, 5)\n", + "(2017-06-03 03:27:01)<< DONE (3.0s)\n", + "(2017-06-03 03:27:01)>> BLOOD PRESSURE SYSTOLIC\n", + "(2017-06-03 03:27:01)>>>> Extracting 14 items from chartevents\n", + "(2017-06-03 03:27:02)<<<< DONE (1.0s)\n", + "(2017-06-03 03:27:02)>>>> Combine DF\n", + "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:02)>>>> Clean UOM\n", + "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>143838</td>\n", + " <td>2129-07-13 22:40:00</td>\n", + " <td>145</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>143838</td>\n", + " <td>2129-07-13 23:00:00</td>\n", + " <td>136</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>143838</td>\n", + " <td>2129-07-13 23:30:00</td>\n", + " <td>179</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:00:00</td>\n", + " <td>131</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:30:00</td>\n", + " <td>146</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 143838 2129-07-13 22:40:00 145 mmHg 51\n", + "1 143838 2129-07-13 23:00:00 136 mmHg 51\n", + "2 143838 2129-07-13 23:30:00 179 mmHg 51\n", + "3 143838 2129-07-14 00:00:00 131 mmHg 51\n", + "4 143838 2129-07-14 00:30:00 146 mmHg 51" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(644, 5)\n", + "(2017-06-03 03:27:02)<< DONE (1.0s)\n", + "(2017-06-03 03:27:02)>> BLOOD PRESSURE DIASTOLIC\n", + "(2017-06-03 03:27:02)>>>> Extracting 15 items from chartevents\n", + "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:02)>>>> Combine DF\n", + "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:02)>>>> Clean UOM\n", + "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 21:00:00</td>\n", + " <td>53</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 14:00:00</td>\n", + " <td>84</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 10:30:00</td>\n", + " <td>54</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 15:00:00</td>\n", + " <td>60</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 16:00:00</td>\n", + " <td>59</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 113540 2161-10-12 21:00:00 53 mmHg 220051\n", + "1 113540 2161-10-12 14:00:00 84 mmHg 220051\n", + "2 113540 2161-10-12 10:30:00 54 mmHg 220051\n", + "3 113540 2161-10-12 15:00:00 60 mmHg 220051\n", + "4 113540 2161-10-12 16:00:00 59 mmHg 220051" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(640, 5)\n", + "(2017-06-03 03:27:02)<< DONE (0.0s)\n", + "(2017-06-03 03:27:02)>> BLOOD PRESSURE MEAN\n", + "(2017-06-03 03:27:03)>>>> Extracting 3 items from chartevents\n", + "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:03)>>>> Combine DF\n", + "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:03)>>>> Clean UOM\n", + "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 21:00:00</td>\n", + " <td>76</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 12:00:00</td>\n", + " <td>91</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 14:00:00</td>\n", + " <td>82</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 10:30:00</td>\n", + " <td>70</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>113540</td>\n", + " <td>2161-10-12 15:00:00</td>\n", + " <td>80</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 113540 2161-10-12 21:00:00 76 mmHg 220052\n", + "1 113540 2161-10-12 12:00:00 91 mmHg 220052\n", + "2 113540 2161-10-12 14:00:00 82 mmHg 220052\n", + "3 113540 2161-10-12 10:30:00 70 mmHg 220052\n", + "4 113540 2161-10-12 15:00:00 80 mmHg 220052" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(58, 5)\n", + "(2017-06-03 03:27:03)<< DONE (1.0s)\n", + "(2017-06-03 03:27:03)>> RESPIRATORY RATE\n", + "(2017-06-03 03:27:03)>>>> Extracting 4 items from chartevents\n", + "(2017-06-03 03:27:04)<<<< DONE (1.0s)\n", + "(2017-06-03 03:27:04)>>>> Combine DF\n", + "(2017-06-03 03:27:04)<<<< DONE (0.0s)\n", + "(2017-06-03 03:27:04)>>>> Clean UOM\n", + "(2017-06-03 03:27:04)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>143838</td>\n", + " <td>2129-07-13 23:30:00</td>\n", + " <td>17</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:00:00</td>\n", + " <td>20</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 00:30:00</td>\n", + " <td>17</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 01:00:00</td>\n", + " <td>13</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>143838</td>\n", + " <td>2129-07-14 01:20:00</td>\n", + " <td>15</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 143838 2129-07-13 23:30:00 17 breath/min 618\n", + "1 143838 2129-07-14 00:00:00 20 breath/min 618\n", + "2 143838 2129-07-14 00:30:00 17 breath/min 618\n", + "3 143838 2129-07-14 01:00:00 13 breath/min 618\n", + "4 143838 2129-07-14 01:20:00 15 breath/min 618" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(1647, 5)\n", + "(2017-06-03 03:27:04)<< DONE (1.0s)\n", + "(2017-06-03 03:27:04) DONE (6.0s)\n" + ] + } + ], + "source": [ + "hadm_ids = mimic.sample_hadm_ids(5,conn)\n", + "extract_labels(conn,labels[0:5],item_map_fname,hdf5_fname,hadm_ids)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 03:27:10) Start extracting 18 labels\n", + "(2017-06-03 03:27:10)>> HEART RATE\n", + "(2017-06-03 03:27:10)>>>> Extracting 5 items from chartevents\n", + "(2017-06-03 03:28:03)<<<< DONE (53.0s)\n", + "(2017-06-03 03:28:03)>>>> Combine DF\n", + "(2017-06-03 03:28:03)<<<< DONE (0.0s)\n", + "(2017-06-03 03:28:03)>>>> Clean UOM\n", + "(2017-06-03 03:28:07)<<<< DONE (4.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-26 03:00:00</td>\n", + " <td>79</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-02 06:00:00</td>\n", + " <td>116</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-02 07:00:00</td>\n", + " <td>116</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-02 08:00:00</td>\n", + " <td>144</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-03 08:00:00</td>\n", + " <td>144</td>\n", + " <td>beat/min</td>\n", + " <td>211</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-26 03:00:00 79 beat/min 211\n", + "1 106266.0 2114-12-02 06:00:00 116 beat/min 211\n", + "2 106266.0 2114-12-02 07:00:00 116 beat/min 211\n", + "3 106266.0 2114-12-02 08:00:00 144 beat/min 211\n", + "4 106266.0 2114-12-03 08:00:00 144 beat/min 211" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(7952939, 5)\n", + "(2017-06-03 03:28:20)<< DONE (70.0s)\n", + "(2017-06-03 03:28:20)>> BLOOD PRESSURE SYSTOLIC\n", + "(2017-06-03 03:28:21)>>>> Extracting 14 items from chartevents\n", + "(2017-06-03 03:29:45)<<<< DONE (84.0s)\n", + "(2017-06-03 03:29:45)>>>> Combine DF\n", + "(2017-06-03 03:29:45)<<<< DONE (0.0s)\n", + "(2017-06-03 03:29:45)>>>> Clean UOM\n", + "(2017-06-03 03:29:48)<<<< DONE (3.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>176203.0</td>\n", + " <td>2154-11-12 22:00:00</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>197569.0</td>\n", + " <td>2133-03-09 00:00:00</td>\n", + " <td>117</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>197569.0</td>\n", + " <td>2133-03-09 01:00:00</td>\n", + " <td>117</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>197569.0</td>\n", + " <td>2133-03-09 02:00:00</td>\n", + " <td>127</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>197569.0</td>\n", + " <td>2133-03-09 03:00:00</td>\n", + " <td>126</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 176203.0 2154-11-12 22:00:00 51\n", + "1 197569.0 2133-03-09 00:00:00 117 mmHg 51\n", + "2 197569.0 2133-03-09 01:00:00 117 mmHg 51\n", + "3 197569.0 2133-03-09 02:00:00 127 mmHg 51\n", + "4 197569.0 2133-03-09 03:00:00 126 mmHg 51" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(6374824, 5)\n", + "(2017-06-03 03:30:00)<< DONE (100.0s)\n", + "(2017-06-03 03:30:00)>> BLOOD PRESSURE DIASTOLIC\n", + "(2017-06-03 03:30:00)>>>> Extracting 15 items from chartevents\n", + "(2017-06-03 03:31:18)<<<< DONE (78.0s)\n", + "(2017-06-03 03:31:18)>>>> Combine DF\n", + "(2017-06-03 03:31:19)<<<< DONE (1.0s)\n", + "(2017-06-03 03:31:19)>>>> Clean UOM\n", + "(2017-06-03 03:31:22)<<<< DONE (3.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>124321.0</td>\n", + " <td>2157-10-21 12:15:00</td>\n", + " <td>74</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>124321.0</td>\n", + " <td>2157-10-21 13:00:00</td>\n", + " <td>67</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>124321.0</td>\n", + " <td>2157-10-21 14:00:00</td>\n", + " <td>64</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>124321.0</td>\n", + " <td>2157-10-21 15:00:00</td>\n", + " <td>76</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>124321.0</td>\n", + " <td>2157-10-21 16:17:00</td>\n", + " <td>80</td>\n", + " <td>mmHg</td>\n", + " <td>220051</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 124321.0 2157-10-21 12:15:00 74 mmHg 220051\n", + "1 124321.0 2157-10-21 13:00:00 67 mmHg 220051\n", + "2 124321.0 2157-10-21 14:00:00 64 mmHg 220051\n", + "3 124321.0 2157-10-21 15:00:00 76 mmHg 220051\n", + "4 124321.0 2157-10-21 16:17:00 80 mmHg 220051" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(6371249, 5)\n", + "(2017-06-03 03:31:34)<< DONE (94.0s)\n", + "(2017-06-03 03:31:34)>> BLOOD PRESSURE MEAN\n", + "(2017-06-03 03:31:34)>>>> Extracting 3 items from chartevents\n", + "(2017-06-03 03:32:13)<<<< DONE (39.0s)\n", + "(2017-06-03 03:32:13)>>>> Combine DF\n", + "(2017-06-03 03:32:13)<<<< DONE (0.0s)\n", + "(2017-06-03 03:32:13)>>>> Clean UOM\n", + "(2017-06-03 03:32:14)<<<< DONE (1.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>124321</td>\n", + " <td>2157-10-21 13:00:00</td>\n", + " <td>86</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>124321</td>\n", + " <td>2157-10-21 14:00:00</td>\n", + " <td>86</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>124321</td>\n", + " <td>2157-10-21 15:00:00</td>\n", + " <td>98</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>124321</td>\n", + " <td>2157-10-21 16:17:00</td>\n", + " <td>104</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>124321</td>\n", + " <td>2157-10-21 17:00:00</td>\n", + " <td>104</td>\n", + " <td>mmHg</td>\n", + " <td>220052</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 124321 2157-10-21 13:00:00 86 mmHg 220052\n", + "1 124321 2157-10-21 14:00:00 86 mmHg 220052\n", + "2 124321 2157-10-21 15:00:00 98 mmHg 220052\n", + "3 124321 2157-10-21 16:17:00 104 mmHg 220052\n", + "4 124321 2157-10-21 17:00:00 104 mmHg 220052" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2536271, 5)\n", + "(2017-06-03 03:32:18)<< DONE (44.0s)\n", + "(2017-06-03 03:32:18)>> RESPIRATORY RATE\n", + "(2017-06-03 03:32:18)>>>> Extracting 4 items from chartevents\n", + "(2017-06-03 03:34:08)<<<< DONE (110.0s)\n", + "(2017-06-03 03:34:08)>>>> Combine DF\n", + "(2017-06-03 03:34:08)<<<< DONE (0.0s)\n", + "(2017-06-03 03:34:08)>>>> Clean UOM\n", + "(2017-06-03 03:34:13)<<<< DONE (5.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>20</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>122659.0</td>\n", + " <td>2131-05-22 14:00:00</td>\n", + " <td>29</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 19:00:00</td>\n", + " <td>24</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>24</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-10 13:30:00</td>\n", + " <td>22</td>\n", + " <td>breath/min</td>\n", + " <td>618</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 20 breath/min 618\n", + "1 122659.0 2131-05-22 14:00:00 29 breath/min 618\n", + "2 188670.0 2183-08-23 19:00:00 24 breath/min 618\n", + "3 188670.0 2183-08-23 20:00:00 24 breath/min 618\n", + "4 185910.0 2166-08-10 13:30:00 22 breath/min 618" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(7810019, 5)\n", + "(2017-06-03 03:34:27)<< DONE (129.0s)\n", + "(2017-06-03 03:34:27)>> TEMPERATURE BODY\n", + "(2017-06-03 03:34:27)>>>> Extracting 4 items from chartevents\n", + "(2017-06-03 03:35:01)<<<< DONE (34.0s)\n", + "(2017-06-03 03:35:01)>>>> Combine DF\n", + "(2017-06-03 03:35:01)<<<< DONE (0.0s)\n", + "(2017-06-03 03:35:01)>>>> Clean UOM\n", + "(2017-06-03 03:35:02)<<<< DONE (1.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>98.400001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>99.300003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-12 08:00:00</td>\n", + " <td>98.699996948242188</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-13 17:00:00</td>\n", + " <td>99.900001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-11 20:00:00</td>\n", + " <td>37.900001525878906</td>\n", + " <td>degC</td>\n", + " <td>676</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 98.400001525878906 degF 678\n", + "1 188670.0 2183-08-23 20:00:00 99.300003051757812 degF 678\n", + "2 185910.0 2166-08-12 08:00:00 98.699996948242188 degF 678\n", + "3 185910.0 2166-08-13 17:00:00 99.900001525878906 degF 678\n", + "4 166707.0 2122-02-11 20:00:00 37.900001525878906 degC 676" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(1751447, 5)\n", + "(2017-06-03 03:35:05)<< DONE (38.0s)\n", + "(2017-06-03 03:35:05)>> OXYGEN SATURATION PULSE OXIMETRY\n", + "(2017-06-03 03:35:06)>>>> Extracting 2 items from chartevents\n", + "(2017-06-03 03:35:59)<<<< DONE (53.0s)\n", + "(2017-06-03 03:35:59)>>>> Combine DF\n", + "(2017-06-03 03:35:59)<<<< DONE (0.0s)\n", + "(2017-06-03 03:35:59)>>>> Clean UOM\n", + "(2017-06-03 03:36:02)<<<< DONE (3.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>100</td>\n", + " <td>percent</td>\n", + " <td>646</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:15:00</td>\n", + " <td>100</td>\n", + " <td>percent</td>\n", + " <td>646</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>122659.0</td>\n", + " <td>2131-05-22 14:00:00</td>\n", + " <td>100</td>\n", + " <td>percent</td>\n", + " <td>646</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 19:00:00</td>\n", + " <td>97</td>\n", + " <td>percent</td>\n", + " <td>646</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>97</td>\n", + " <td>percent</td>\n", + " <td>646</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 100 percent 646\n", + "1 185910.0 2166-08-25 00:15:00 100 percent 646\n", + "2 122659.0 2131-05-22 14:00:00 100 percent 646\n", + "3 188670.0 2183-08-23 19:00:00 97 percent 646\n", + "4 188670.0 2183-08-23 20:00:00 97 percent 646" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(6099827, 5)\n", + "(2017-06-03 03:36:14)<< DONE (69.0s)\n", + "(2017-06-03 03:36:14)>> WEIGHT BODY\n", + "(2017-06-03 03:36:14)>>>> Extracting 3 items from chartevents\n", + "(2017-06-03 03:36:48)<<<< DONE (34.0s)\n", + "(2017-06-03 03:36:48)>>>> Combine DF\n", + "(2017-06-03 03:36:49)<<<< DONE (1.0s)\n", + "(2017-06-03 03:36:49)>>>> Clean UOM\n", + "(2017-06-03 03:36:49)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-20 06:00:00</td>\n", + " <td>102.5</td>\n", + " <td>kg</td>\n", + " <td>763</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-15 07:00:00</td>\n", + " <td>99.400001525878906</td>\n", + " <td>kg</td>\n", + " <td>763</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>182104.0</td>\n", + " <td>2131-05-05 06:00:00</td>\n", + " <td>109.69999694824219</td>\n", + " <td>kg</td>\n", + " <td>763</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>157907.0</td>\n", + " <td>2129-06-10 05:00:00</td>\n", + " <td>103.19999694824219</td>\n", + " <td>kg</td>\n", + " <td>763</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-14 06:00:00</td>\n", + " <td>101.80000305175781</td>\n", + " <td>kg</td>\n", + " <td>763</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-20 06:00:00 102.5 kg 763\n", + "1 166707.0 2122-02-15 07:00:00 99.400001525878906 kg 763\n", + "2 182104.0 2131-05-05 06:00:00 109.69999694824219 kg 763\n", + "3 157907.0 2129-06-10 05:00:00 103.19999694824219 kg 763\n", + "4 166707.0 2122-02-14 06:00:00 101.80000305175781 kg 763" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(95425, 5)\n", + "(2017-06-03 03:36:49)<< DONE (35.0s)\n", + "(2017-06-03 03:36:49)>> OUTPUT URINE\n", + "(2017-06-03 03:36:49)>>>> Extracting 2 items from chartevents\n", + "(2017-06-03 03:37:28)<<<< DONE (39.0s)\n", + "(2017-06-03 03:37:28)>>>> Extracting 29 items from outputevents\n", + "(2017-06-03 03:37:59)<<<< DONE (31.0s)\n", + "(2017-06-03 03:37:59)>>>> Combine DF\n", + "(2017-06-03 03:37:59)<<<< DONE (0.0s)\n", + "(2017-06-03 03:37:59)>>>> Clean UOM\n", + "(2017-06-03 03:38:09)<<<< DONE (10.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-03 08:00:00</td>\n", + " <td>Voiding qs</td>\n", + " <td>ml</td>\n", + " <td>3686</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-09 09:00:00</td>\n", + " <td>Voiding qs</td>\n", + " <td>ml</td>\n", + " <td>3686</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-09 14:00:00</td>\n", + " <td>Voiding qs</td>\n", + " <td>ml</td>\n", + " <td>3686</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-05 21:30:00</td>\n", + " <td>Voiding qs</td>\n", + " <td>ml</td>\n", + " <td>3686</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>106266.0</td>\n", + " <td>2114-12-04 16:00:00</td>\n", + " <td>Voiding qs</td>\n", + " <td>ml</td>\n", + " <td>3686</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 106266.0 2114-12-03 08:00:00 Voiding qs ml 3686\n", + "1 106266.0 2114-12-09 09:00:00 Voiding qs ml 3686\n", + "2 106266.0 2114-12-09 14:00:00 Voiding qs ml 3686\n", + "3 106266.0 2114-12-05 21:30:00 Voiding qs ml 3686\n", + "4 106266.0 2114-12-04 16:00:00 Voiding qs ml 3686" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(3644639, 5)\n", + "(2017-06-03 03:38:15)<< DONE (86.0s)\n", + "(2017-06-03 03:38:15)>> GLASGOW COMA SCALE MOTOR\n", + "(2017-06-03 03:38:15)>>>> Extracting 1 items from chartevents\n", + "(2017-06-03 03:39:12)<<<< DONE (57.0s)\n", + "(2017-06-03 03:39:12)>>>> Combine DF\n", + "(2017-06-03 03:39:12)<<<< DONE (0.0s)\n", + "(2017-06-03 03:39:12)>>>> Clean UOM\n", + "(2017-06-03 03:39:12)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>6 Obeys Commands</td>\n", + " <td></td>\n", + " <td>454</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>6 Obeys Commands</td>\n", + " <td></td>\n", + " <td>454</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-27 12:00:00</td>\n", + " <td>5 Localizes Pain</td>\n", + " <td></td>\n", + " <td>454</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>185910.0</td>\n", + " <td>2166-09-03 12:00:00</td>\n", + " <td>6 Obeys Commands</td>\n", + " <td></td>\n", + " <td>454</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>101757.0</td>\n", + " <td>2133-01-03 16:00:00</td>\n", + " <td>6 Obeys Commands</td>\n", + " <td></td>\n", + " <td>454</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 6 Obeys Commands 454\n", + "1 188670.0 2183-08-23 20:00:00 6 Obeys Commands 454\n", + "2 185910.0 2166-08-27 12:00:00 5 Localizes Pain 454\n", + "3 185910.0 2166-09-03 12:00:00 6 Obeys Commands 454\n", + "4 101757.0 2133-01-03 16:00:00 6 Obeys Commands 454" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(952565, 5)\n", + "(2017-06-03 03:39:13)<< DONE (58.0s)\n", + "(2017-06-03 03:39:13)>> GLASGOW COMA SCALE EYE OPENING\n", + "(2017-06-03 03:39:13)>>>> Extracting 1 items from chartevents\n", + "(2017-06-03 03:39:57)<<<< DONE (44.0s)\n", + "(2017-06-03 03:39:57)>>>> Combine DF\n", + "(2017-06-03 03:39:57)<<<< DONE (0.0s)\n", + "(2017-06-03 03:39:57)>>>> Clean UOM\n", + "(2017-06-03 03:39:57)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>4 Spontaneously</td>\n", + " <td></td>\n", + " <td>184</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-15 20:00:00</td>\n", + " <td>4 Spontaneously</td>\n", + " <td></td>\n", + " <td>184</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-16 16:00:00</td>\n", + " <td>3 To speech</td>\n", + " <td></td>\n", + " <td>184</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-23 04:00:00</td>\n", + " <td>3 To speech</td>\n", + " <td></td>\n", + " <td>184</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-27 12:00:00</td>\n", + " <td>1 No Response</td>\n", + " <td></td>\n", + " <td>184</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 188670.0 2183-08-23 20:00:00 4 Spontaneously 184\n", + "1 185910.0 2166-08-15 20:00:00 4 Spontaneously 184\n", + "2 185910.0 2166-08-16 16:00:00 3 To speech 184\n", + "3 185910.0 2166-08-23 04:00:00 3 To speech 184\n", + "4 185910.0 2166-08-27 12:00:00 1 No Response 184" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(956672, 5)\n", + "(2017-06-03 03:39:58)<< DONE (45.0s)\n", + "(2017-06-03 03:39:58)>> GLASGOW COMA SCALE VERBAL\n", + "(2017-06-03 03:39:59)>>>> Extracting 1 items from chartevents\n", + "(2017-06-03 03:40:22)<<<< DONE (23.0s)\n", + "(2017-06-03 03:40:22)>>>> Combine DF\n", + "(2017-06-03 03:40:22)<<<< DONE (0.0s)\n", + "(2017-06-03 03:40:22)>>>> Clean UOM\n", + "(2017-06-03 03:40:22)<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>1.0 ET/Trach</td>\n", + " <td></td>\n", + " <td>723</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>4 Confused</td>\n", + " <td></td>\n", + " <td>723</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-12 08:00:00</td>\n", + " <td>1.0 ET/Trach</td>\n", + " <td></td>\n", + " <td>723</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-27 12:00:00</td>\n", + " <td>1.0 ET/Trach</td>\n", + " <td></td>\n", + " <td>723</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-11 20:00:00</td>\n", + " <td>5 Oriented</td>\n", + " <td></td>\n", + " <td>723</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 1.0 ET/Trach 723\n", + "1 188670.0 2183-08-23 20:00:00 4 Confused 723\n", + "2 185910.0 2166-08-12 08:00:00 1.0 ET/Trach 723\n", + "3 185910.0 2166-08-27 12:00:00 1.0 ET/Trach 723\n", + "4 166707.0 2122-02-11 20:00:00 5 Oriented 723" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(954700, 5)\n", + "(2017-06-03 03:40:24)<< DONE (26.0s)\n", + "(2017-06-03 03:40:24)>> NORMAL SALINE\n", + "(2017-06-03 03:40:24)>>>> Extracting 2 items from chartevents\n", + "(2017-06-03 03:40:24)<<<< DONE (0.0s)\n", + "(2017-06-03 03:40:24)>>>> Extracting 4 items from inputevents_cv\n", + "(2017-06-03 03:40:25)<<<< DONE (1.0s)\n", + "(2017-06-03 03:40:25)>>>> Extracting 2 items from inputevents_mv\n", + "(2017-06-03 03:40:43)<<<< DONE (18.0s)\n", + "(2017-06-03 03:40:43)>>>> Combine DF\n", + "(2017-06-03 03:40:43)<<<< DONE (0.0s)\n", + "(2017-06-03 03:40:43)>>>> Clean UOM\n", + "(2017-06-03 03:40:46)<<<< DONE (3.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>110468</td>\n", + " <td>2134-02-13 03:45:00</td>\n", + " <td>given</td>\n", + " <td>ml</td>\n", + " <td>4647</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>110468</td>\n", + " <td>2134-02-13 07:05:00</td>\n", + " <td>given</td>\n", + " <td>ml</td>\n", + " <td>4647</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>175419</td>\n", + " <td>2122-08-16 01:00:00</td>\n", + " <td>given</td>\n", + " <td>ml</td>\n", + " <td>4647</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>143494</td>\n", + " <td>2147-07-02 23:00:00</td>\n", + " <td>given</td>\n", + " <td>ml</td>\n", + " <td>4647</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>143494</td>\n", + " <td>2147-07-02 23:43:00</td>\n", + " <td>given</td>\n", + " <td>ml</td>\n", + " <td>4647</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 110468 2134-02-13 03:45:00 given ml 4647\n", + "1 110468 2134-02-13 07:05:00 given ml 4647\n", + "2 175419 2122-08-16 01:00:00 given ml 4647\n", + "3 143494 2147-07-02 23:00:00 given ml 4647\n", + "4 143494 2147-07-02 23:43:00 given ml 4647" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(817373, 5)\n", + "(2017-06-03 03:40:46)<< DONE (22.0s)\n", + "(2017-06-03 03:40:46)>> LACTATED RINGERS\n", + "(2017-06-03 03:40:46)>>>> Extracting 2 items from chartevents\n", + "(2017-06-03 03:40:46)<<<< DONE (0.0s)\n", + "(2017-06-03 03:40:46)>>>> Extracting 7 items from inputevents_cv\n", + "(2017-06-03 03:40:50)<<<< DONE (4.0s)\n", + "(2017-06-03 03:40:50)>>>> Extracting 2 items from inputevents_mv\n", + "(2017-06-03 03:40:51)<<<< DONE (1.0s)\n", + "(2017-06-03 03:40:51)>>>> Combine DF\n", + "(2017-06-03 03:40:51)<<<< DONE (0.0s)\n", + "(2017-06-03 03:40:51)>>>> Clean UOM\n", + "(2017-06-03 03:40:53)<<<< DONE (2.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>194762.0</td>\n", + " <td>2110-11-22 18:00:00</td>\n", + " <td>100</td>\n", + " <td>ml</td>\n", + " <td>1634</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>178769.0</td>\n", + " <td>2181-06-01 05:00:00</td>\n", + " <td>100</td>\n", + " <td>ml</td>\n", + " <td>2971</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>178769.0</td>\n", + " <td>2181-06-01 01:00:00</td>\n", + " <td>100</td>\n", + " <td>ml</td>\n", + " <td>2971</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>178769.0</td>\n", + " <td>2181-06-01 02:00:00</td>\n", + " <td>100</td>\n", + " <td>ml</td>\n", + " <td>2971</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>178769.0</td>\n", + " <td>2181-06-01 03:00:00</td>\n", + " <td>100</td>\n", + " <td>ml</td>\n", + " <td>2971</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 194762.0 2110-11-22 18:00:00 100 ml 1634\n", + "1 178769.0 2181-06-01 05:00:00 100 ml 2971\n", + "2 178769.0 2181-06-01 01:00:00 100 ml 2971\n", + "3 178769.0 2181-06-01 02:00:00 100 ml 2971\n", + "4 178769.0 2181-06-01 03:00:00 100 ml 2971" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(504306, 5)\n", + "(2017-06-03 03:40:53)<< DONE (7.0s)\n", + "(2017-06-03 03:40:53)>> NOREPINEPHRINE\n", + "(2017-06-03 03:40:53)>>>> Extracting 2 items from inputevents_cv\n", + "(2017-06-03 03:41:10)<<<< DONE (17.0s)\n", + "(2017-06-03 03:41:10)>>>> Extracting 1 items from inputevents_mv\n", + "(2017-06-03 03:41:12)<<<< DONE (2.0s)\n", + "(2017-06-03 03:41:12)>>>> Combine DF\n", + "(2017-06-03 03:41:12)<<<< DONE (0.0s)\n", + "(2017-06-03 03:41:12)>>>> Clean UOM\n", + "(2017-06-03 03:41:16)<<<< DONE (4.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>181516.0</td>\n", + " <td>2121-01-27 00:00:00</td>\n", + " <td>NaN</td>\n", + " <td>mg</td>\n", + " <td>30120</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>194502.0</td>\n", + " <td>2102-12-20 08:00:00</td>\n", + " <td>NaN</td>\n", + " <td>mg</td>\n", + " <td>30047</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>172260.0</td>\n", + " <td>2124-11-11 16:00:00</td>\n", + " <td>NaN</td>\n", + " <td>mg</td>\n", + " <td>30047</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>114829.0</td>\n", + " <td>2107-01-15 22:00:00</td>\n", + " <td>NaN</td>\n", + " <td>mg</td>\n", + " <td>30047</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>181516.0</td>\n", + " <td>2121-01-27 01:00:00</td>\n", + " <td>NaN</td>\n", + " <td>mg</td>\n", + " <td>30120</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 181516.0 2121-01-27 00:00:00 NaN mg 30120\n", + "1 194502.0 2102-12-20 08:00:00 NaN mg 30047\n", + "2 172260.0 2124-11-11 16:00:00 NaN mg 30047\n", + "3 114829.0 2107-01-15 22:00:00 NaN mg 30047\n", + "4 181516.0 2121-01-27 01:00:00 NaN mg 30120" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(1136938, 5)\n", + "(2017-06-03 03:41:16)<< DONE (23.0s)\n", + "(2017-06-03 03:41:16)>> VASOPRESSIN\n", + "(2017-06-03 03:41:16)>>>> Extracting 10 items from chartevents\n", + "(2017-06-03 03:41:17)<<<< DONE (1.0s)\n", + "(2017-06-03 03:41:17)>>>> Extracting 4 items from inputevents_cv\n", + "(2017-06-03 03:41:22)<<<< DONE (5.0s)\n", + "(2017-06-03 03:41:22)>>>> Extracting 1 items from inputevents_mv\n", + "(2017-06-03 03:41:23)<<<< DONE (1.0s)\n", + "(2017-06-03 03:41:23)>>>> Combine DF\n", + "(2017-06-03 03:41:23)<<<< DONE (0.0s)\n", + "(2017-06-03 03:41:23)>>>> Clean UOM\n", + "(2017-06-03 03:41:24)<<<< DONE (1.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>126005.0</td>\n", + " <td>2126-09-05 16:30:00</td>\n", + " <td></td>\n", + " <td>U</td>\n", + " <td>1136</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>126005.0</td>\n", + " <td>2126-09-05 16:45:00</td>\n", + " <td></td>\n", + " <td>units/hour</td>\n", + " <td>1136</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>115221.0</td>\n", + " <td>2194-12-09 05:00:00</td>\n", + " <td>3</td>\n", + " <td>U</td>\n", + " <td>1136</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>115221.0</td>\n", + " <td>2194-12-09 06:00:00</td>\n", + " <td>3</td>\n", + " <td>units/hour</td>\n", + " <td>1136</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>115221.0</td>\n", + " <td>2194-12-09 04:00:00</td>\n", + " <td>3</td>\n", + " <td>units/hour</td>\n", + " <td>1136</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 126005.0 2126-09-05 16:30:00 U 1136\n", + "1 126005.0 2126-09-05 16:45:00 units/hour 1136\n", + "2 115221.0 2194-12-09 05:00:00 3 U 1136\n", + "3 115221.0 2194-12-09 06:00:00 3 units/hour 1136\n", + "4 115221.0 2194-12-09 04:00:00 3 units/hour 1136" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(339184, 5)\n", + "(2017-06-03 03:41:24)<< DONE (8.0s)\n", + "(2017-06-03 03:41:24)>> HEMOGLOBIN\n", + "(2017-06-03 03:41:24)>>>> Extracting 3 items from chartevents\n", + "(2017-06-03 03:43:00)<<<< DONE (96.0s)\n", + "(2017-06-03 03:43:00)>>>> Extracting 2 items from labevents\n", + "(2017-06-03 03:43:27)<<<< DONE (27.0s)\n", + "(2017-06-03 03:43:27)>>>> Combine DF\n", + "(2017-06-03 03:43:27)<<<< DONE (0.0s)\n", + "(2017-06-03 03:43:27)>>>> Clean UOM\n", + "(2017-06-03 03:43:30)<<<< DONE (3.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-13 01:53:00</td>\n", + " <td>9.5</td>\n", + " <td>gm/dl</td>\n", + " <td>814</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-22 02:14:00</td>\n", + " <td>10</td>\n", + " <td>gm/dl</td>\n", + " <td>814</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-18 03:46:00</td>\n", + " <td>10.100000381469727</td>\n", + " <td>gm/dl</td>\n", + " <td>814</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>157907.0</td>\n", + " <td>2129-06-11 02:00:00</td>\n", + " <td>9.8999996185302734</td>\n", + " <td>gm/dl</td>\n", + " <td>814</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-30 02:07:00</td>\n", + " <td>9</td>\n", + " <td>gm/dl</td>\n", + " <td>814</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-13 01:53:00 9.5 gm/dl 814\n", + "1 185910.0 2166-08-22 02:14:00 10 gm/dl 814\n", + "2 185910.0 2166-08-18 03:46:00 10.100000381469727 gm/dl 814\n", + "3 157907.0 2129-06-11 02:00:00 9.8999996185302734 gm/dl 814\n", + "4 185910.0 2166-08-30 02:07:00 9 gm/dl 814" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(1167921, 5)\n", + "(2017-06-03 03:43:31)<< DONE (127.0s)\n", + "(2017-06-03 03:43:31)>> LACTATE\n", + "(2017-06-03 03:43:31)>>>> Extracting 3 items from chartevents\n", + "(2017-06-03 03:44:30)<<<< DONE (59.0s)\n", + "(2017-06-03 03:44:30)>>>> Extracting 1 items from labevents\n", + "(2017-06-03 03:44:33)<<<< DONE (3.0s)\n", + "(2017-06-03 03:44:33)>>>> Combine DF\n", + "(2017-06-03 03:44:33)<<<< DONE (0.0s)\n", + "(2017-06-03 03:44:33)>>>> Clean UOM\n", + "(2017-06-03 03:44:34)<<<< DONE (1.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-11 21:20:00</td>\n", + " <td>1.5</td>\n", + " <td>mmol/L</td>\n", + " <td>818</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-11 21:20:00</td>\n", + " <td>1.5</td>\n", + " <td>mmol/L</td>\n", + " <td>1531</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>175413.0</td>\n", + " <td>2170-04-11 15:00:00</td>\n", + " <td></td>\n", + " <td>mmol/L</td>\n", + " <td>818</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>146828.0</td>\n", + " <td>2186-10-03 21:54:00</td>\n", + " <td>1.8</td>\n", + " <td>mmol/L</td>\n", + " <td>818</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>146828.0</td>\n", + " <td>2186-10-03 21:54:00</td>\n", + " <td>1.8</td>\n", + " <td>mmol/L</td>\n", + " <td>1531</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-11 21:20:00 1.5 mmol/L 818\n", + "1 185910.0 2166-08-11 21:20:00 1.5 mmol/L 1531\n", + "2 175413.0 2170-04-11 15:00:00 mmol/L 818\n", + "3 146828.0 2186-10-03 21:54:00 1.8 mmol/L 818\n", + "4 146828.0 2186-10-03 21:54:00 1.8 mmol/L 1531" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(393608, 5)\n", + "(2017-06-03 03:44:35)<< DONE (64.0s)\n", + "(2017-06-03 03:44:35) DONE (1045.0s)\n" + ] + } + ], + "source": [ + "df_all = extract_labels(conn,labels,item_map_fname,hdf5_fname)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Transform (and \"Load\") MIMIC III Data" + ] + }, + { + "cell_type": "code", + "execution_count": 152, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import icu_data_defs \n", + "import mimic\n", + "from sklearn.pipeline import Pipeline\n", + "import logger\n", + "import pandas as pd\n", + "from constants import column_names\n", + "import utils\n", + "import warnings\n", + "warnings.filterwarnings('ignore')" + ] + }, + { + "cell_type": "code", + "execution_count": 153, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(utils)\n", + "reload(logger)\n", + "reload(mimic)\n", + "def transform_extracted_labels(labels,hdf5_fname):\n", + " \n", + " pipeline = Pipeline([\n", + " ('clean',mimic.clean_extract()),\n", + " ('unstack',mimic.unstacker()),\n", + " ('clean_uom',mimic.clean_uom())\n", + " ])\n", + " \n", + " for label in labels:\n", + " logger.log('Opening {}'.format(label.upper()))\n", + " df = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n", + " logger.log('Transforming {} - {}'.format(label.upper(),df.shape))\n", + " df_transformed = pipeline.transform(df)\n", + " # Add label guess to column index\n", + " df = utils.add_same_val__index_level(df,label,'label',axis=1)\n", + " display(df_transformed.head())\n", + " utils.save_df(df_transformed,hdf5_fname,'transformed/{}'.format(label))\n", + " del df,df_transformed\n", + " logger.end_log_level()\n", + " \n", + " return\n", + " \n", + "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n", + "hdf5_fname = 'data/mimic_data'\n", + "\n", + "#get all labels\n", + "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n", + "simple_data = data_dict.get_panel_defintions(12) #12 is \"simple data\"\n", + "labels = simple_data.label.unique().tolist()" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-02 05:11:14) Opening HEART RATE\n", + "(2017-06-02 05:11:19) DONE (5.0s)\n", + "(2017-06-02 05:11:19) Transforming HEART RATE - (7952939, 5)\n" + ] + }, + { + "ename": "KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[1;32m<ipython-input-3-4ff30e8e4bcc>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mtransform_extracted_labels\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabels\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m", + "\u001b[1;32m<ipython-input-2-7e9518f41127>\u001b[0m in \u001b[0;36mtransform_extracted_labels\u001b[1;34m(labels, hdf5_fname)\u001b[0m\n\u001b[0;32m 14\u001b[0m \u001b[0mdf\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mopen_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'extract/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 15\u001b[0m \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mlog\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'Transforming {} - {}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mupper\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 16\u001b[1;33m \u001b[0mdf_transformed\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpipeline\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mtransform\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 17\u001b[0m \u001b[0mdisplay\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_transformed\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mhead\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 18\u001b[0m \u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msave_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_transformed\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'transformed/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\sklearn\\pipeline.pyc\u001b[0m in \u001b[0;36m_transform\u001b[1;34m(self, X)\u001b[0m\n\u001b[0;32m 446\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mname\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mtransform\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msteps\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 447\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mtransform\u001b[0m \u001b[1;32mis\u001b[0m \u001b[1;32mnot\u001b[0m \u001b[0mNone\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 448\u001b[1;33m \u001b[0mXt\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mtransform\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mtransform\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mXt\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 449\u001b[0m \u001b[1;32mreturn\u001b[0m \u001b[0mXt\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 450\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.pyc\u001b[0m in \u001b[0;36mtransform\u001b[1;34m(self, df)\u001b[0m\n\u001b[0;32m 189\u001b[0m \u001b[0mFORMAT\u001b[0m \u001b[0mpre\u001b[0m\u001b[1;33m-\u001b[0m\u001b[0munstack\u001b[0m \u001b[0mcolumns\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 190\u001b[0m \"\"\"\n\u001b[1;32m--> 191\u001b[1;33m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mreplace\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mto_replace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m''\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnan\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 192\u001b[0m \u001b[1;31m#drop NAN record_id, timestamps, or value\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 193\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mdropna\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0msubset\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mID\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mDATETIME\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mVALUE\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mhow\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m'any'\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\generic.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, limit, regex, method, axis)\u001b[0m\n\u001b[0;32m 3538\u001b[0m new_data = self._data.replace(to_replace=to_replace,\n\u001b[0;32m 3539\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mvalue\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3540\u001b[1;33m regex=regex)\n\u001b[0m\u001b[0;32m 3541\u001b[0m \u001b[1;32melse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3542\u001b[0m msg = ('Invalid \"to_replace\" type: '\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, **kwargs)\u001b[0m\n\u001b[0;32m 3172\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3173\u001b[0m \u001b[1;32mdef\u001b[0m \u001b[0mreplace\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3174\u001b[1;33m \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mapply\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'replace'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 3175\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3176\u001b[0m def replace_list(self, src_list, dest_list, inplace=False, regex=False,\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mapply\u001b[1;34m(self, f, axes, filter, do_integrity_check, consolidate, **kwargs)\u001b[0m\n\u001b[0;32m 3033\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3034\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'mgr'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3035\u001b[1;33m \u001b[0mapplied\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mgetattr\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mb\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mf\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 3036\u001b[0m \u001b[0mresult_blocks\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0m_extend_blocks\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mapplied\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mresult_blocks\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3037\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, filter, regex, convert, mgr)\u001b[0m\n\u001b[0;32m 1926\u001b[0m \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 1927\u001b[0m \u001b[0mfilter\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mfilter\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mregex\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mregex\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 1928\u001b[1;33m convert=convert, mgr=mgr)\n\u001b[0m\u001b[0;32m 1929\u001b[0m \u001b[1;32melif\u001b[0m \u001b[0mboth_lists\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 1930\u001b[0m \u001b[1;32mfor\u001b[0m \u001b[0mto_rep\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mv\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mzip\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mto_replace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, filter, regex, convert, mgr)\u001b[0m\n\u001b[0;32m 623\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 624\u001b[0m \u001b[0moriginal_to_replace\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mto_replace\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 625\u001b[1;33m \u001b[0mmask\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0misnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 626\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 627\u001b[0m \u001b[1;31m# try to replace, if we raise an error, convert to ObjectBlock and\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36misnull\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m 43\u001b[0m \u001b[0mpandas\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnotnull\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mboolean\u001b[0m \u001b[0minverse\u001b[0m \u001b[0mof\u001b[0m \u001b[0mpandas\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 44\u001b[0m \"\"\"\n\u001b[1;32m---> 45\u001b[1;33m \u001b[1;32mreturn\u001b[0m \u001b[0m_isnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 46\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 47\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36m_isnull_new\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m 53\u001b[0m \u001b[1;32mraise\u001b[0m \u001b[0mNotImplementedError\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m\"isnull is not defined for MultiIndex\"\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 54\u001b[0m \u001b[1;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mABCSeries\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mndarray\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mABCIndexClass\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 55\u001b[1;33m \u001b[1;32mreturn\u001b[0m \u001b[0m_isnull_ndarraylike\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 56\u001b[0m \u001b[1;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mABCGeneric\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 57\u001b[0m \u001b[1;32mreturn\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_constructor\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_data\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mfunc\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36m_isnull_ndarraylike\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m 139\u001b[0m \u001b[0mresult\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mempty\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mbool\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 140\u001b[0m \u001b[0mvec\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mlib\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnullobj\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mvalues\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mravel\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 141\u001b[1;33m \u001b[0mresult\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvec\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mreshape\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 142\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 143\u001b[0m \u001b[1;32melif\u001b[0m \u001b[0mneeds_i8_conversion\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "transform_extracted_labels(labels,hdf5_fname)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "store = pd.HDFStore(hdf5_fname)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<class 'pandas.io.pytables.HDFStore'>\n", + "File path: data/mimic_data\n", + "/extract/blood pressure diastolic frame (shape->[6371249,5])\n", + "/extract/blood pressure mean frame (shape->[2536271,5])\n", + "/extract/blood pressure systolic frame (shape->[6374824,5])\n", + "/extract/glasgow coma scale eye opening frame (shape->[956672,5]) \n", + "/extract/glasgow coma scale motor frame (shape->[952565,5]) \n", + "/extract/glasgow coma scale verbal frame (shape->[954700,5]) \n", + "/extract/heart rate frame (shape->[7952939,5])\n", + "/extract/hemoglobin frame (shape->[1167921,5])\n", + "/extract/lactate frame (shape->[393608,5]) \n", + "/extract/lactated ringers frame (shape->[504306,5]) \n", + "/extract/norepinephrine frame (shape->[1136938,5])\n", + "/extract/normal saline frame (shape->[817373,5]) \n", + "/extract/output urine frame (shape->[3644639,5])\n", + "/extract/oxygen saturation pulse oximetry frame (shape->[6099827,5])\n", + "/extract/respiratory rate frame (shape->[7810019,5])\n", + "/extract/temperature body frame (shape->[1751447,5])\n", + "/extract/vasopressin frame (shape->[339184,5]) \n", + "/extract/weight body frame (shape->[95425,5]) \n", + "/transformed/blood pressure diastolic frame \n", + "/transformed/blood pressure mean frame \n", + "/transformed/blood pressure systolic frame \n", + "/transformed/glasgow coma scale eye opening frame \n", + "/transformed/glasgow coma scale motor frame \n", + "/transformed/glasgow coma scale verbal frame \n", + "/transformed/heart rate frame \n", + "/transformed/hemoglobin frame \n", + "/transformed/lactate frame \n", + "/transformed/lactated ringers frame \n", + "/transformed/norepinephrine frame \n", + "/transformed/normal saline frame \n", + "/transformed/output urine frame \n", + "/transformed/oxygen saturation pulse oximetry frame \n", + "/transformed/respiratory rate frame \n", + "/transformed/temperature body frame \n", + "/transformed/vasopressin frame \n", + "/transformed/weight body frame " + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "store" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "store.close()" + ] + }, + { + "cell_type": "code", + "execution_count": 116, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<module 'utils' from 'utils.py'>" + ] + }, + "execution_count": 116, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "reload(utils)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Cleaners" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Design decision: If a given column has both NUMERIC CATEGORICAL and QUANTITATIVE data, all NUMERIC CATEGORICAL data will actually be treated like QUANTITATIVE data, unfortunately." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import transformers\n", + "import utils\n", + "from sklearn.pipeline import Pipeline\n", + "from units import MedicalUreg\n", + "import icu_data_defs\n", + "import units\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(transformers)\n", + "reload(utils)\n", + "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n", + "hdf5_fname = 'data/mimic_data'\n", + "medical_units = 'config/medical_units.txt'\n", + "\n", + "#get all labels\n", + "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n", + "label = 'lactate'\n", + "\n", + "standard_pipeline = Pipeline([\n", + " ('aggregate_same_datetime',transformers.same_index_aggregator(agg_func=lambda x:x.iloc[0])),\n", + " ('split_dtype',transformers.split_dtype()),\n", + " ('format_columns',transformers.format_columns(data_dict,MedicalUreg(medical_units))),\n", + " ('drop_small_columns',transformers.remove_small_columns(threshold=50))\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "transformers.py:103: SettingWithCopyWarning: \n", + "A value is trying to be set on a copy of a slice from a DataFrame\n", + "\n", + "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy\n", + " df_out.dropna(how='all',inplace=True,axis=1)\n" + ] + }, + { + "data": { + "text/plain": [ + "(113L, 0, '0.0%')" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df = utils.open_df('data/mimic_data','transformed/{}'.format(label))\n", + "df_cleaned = standard_pipeline.transform(df)\n", + "utils.data_loss(df,df_cleaned)" + ] + }, + { + "cell_type": "code", + "execution_count": 216, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"6\" halign=\"left\">lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"4\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"2\" halign=\"left\">mmol/L</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>50813</th>\n", + " <th>225668</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>50813(mmol/L)</th>\n", + " <th>818</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>100001</th>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100003</th>\n", + " <th>2150-04-17 19:12:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-08 10:58:00</th>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-03-31 00:44:00</th>\n", + " <td>3.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-02 14:10:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100009</th>\n", + " <th>2162-05-17 13:19:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2162-05-17 17:14:00</th>\n", + " <td>1.5</td>\n", + " <td>1.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">100010</th>\n", + " <th>2109-12-10 10:25:00</th>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 12:11:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:05:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:58:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100011</th>\n", + " <th>2177-08-29 04:44:00</th>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-08-29 06:55:00</th>\n", + " <td>2.3</td>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100012</th>\n", + " <th>2177-03-14 07:38:00</th>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-14 11:42:00</th>\n", + " <td>2.5</td>\n", + " <td>2.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 08:05:00</th>\n", + " <td>2.1</td>\n", + " <td>2.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 14:01:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 21:42:00</th>\n", + " <td>1.8</td>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100016</th>\n", + " <th>2188-05-24 12:00:00</th>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100017</th>\n", + " <th>2103-03-11 05:10:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100018</th>\n", + " <th>2176-08-29 15:29:00</th>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 09:23:00</th>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 10:19:00</th>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 11:29:00</th>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 12:40:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100020</th>\n", + " <th>2142-11-30 21:54:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2142-12-03 00:17:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100024</th>\n", + " <th>2170-09-19 10:25:00</th>\n", + " <td>1.4</td>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-19 16:33:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-20 02:04:00</th>\n", + " <td>3.2</td>\n", + " <td>3.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199976</th>\n", + " <th>2182-02-14 11:15:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-16 03:57:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-19 03:59:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-20 03:31:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-21 04:55:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199979</th>\n", + " <th>2182-02-06 09:17:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-06 14:16:00</th>\n", + " <td>3.8</td>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">199981</th>\n", + " <th>2110-09-24 16:34:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-24 20:09:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-25 06:10:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>199987</th>\n", + " <th>2175-05-19 16:30:00</th>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">199988</th>\n", + " <th>2169-01-24 12:48:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 01:35:00</th>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 11:18:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 16:43:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 22:35:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-10 05:33:00</th>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199993</th>\n", + " <th>2161-11-12 23:14:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-11-13 03:46:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">199994</th>\n", + " <th>2188-07-07 21:23:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 03:09:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 04:13:00</th>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 06:20:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199998</th>\n", + " <th>2119-02-20 10:52:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 12:36:00</th>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:33:00</th>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:59:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 20:43:00</th>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199999</th>\n", + " <th>2136-04-04 20:55:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 15:29:00</th>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>177451 rows × 6 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label lactate \n", + "status known unknown \n", + "variable_type qn qn nom \n", + "units mmol/L no_units no_units \n", + "description 50813 225668 818 1531 50813(mmol/L) 818\n", + "id datetime \n", + "100001 2117-09-11 09:32:00 1.9 NaN NaN NaN NaN NaN\n", + "100003 2150-04-17 19:12:00 1.1 1.1 NaN NaN NaN NaN\n", + "100006 2108-04-08 10:58:00 4.5 NaN 4.5 NaN NaN NaN\n", + "100007 2145-03-31 00:44:00 3.1 NaN NaN NaN NaN NaN\n", + " 2145-04-02 14:10:00 1.9 NaN NaN NaN NaN NaN\n", + "100009 2162-05-17 13:19:00 1.1 1.1 NaN NaN NaN NaN\n", + " 2162-05-17 17:14:00 1.5 1.5 NaN NaN NaN NaN\n", + "100010 2109-12-10 10:25:00 0.6 NaN NaN NaN NaN NaN\n", + " 2109-12-10 12:11:00 0.9 NaN NaN NaN NaN NaN\n", + " 2109-12-10 13:05:00 1.0 NaN NaN NaN NaN NaN\n", + " 2109-12-10 13:58:00 0.8 NaN NaN NaN NaN NaN\n", + "100011 2177-08-29 04:44:00 3.8 NaN NaN NaN NaN NaN\n", + " 2177-08-29 06:55:00 2.3 2.3 NaN NaN NaN NaN\n", + "100012 2177-03-14 07:38:00 2.3 NaN NaN NaN NaN NaN\n", + " 2177-03-14 11:42:00 2.5 2.5 NaN NaN NaN NaN\n", + " 2177-03-15 08:05:00 2.1 2.1 NaN NaN NaN NaN\n", + " 2177-03-15 14:01:00 2.6 2.6 NaN NaN NaN NaN\n", + " 2177-03-15 21:42:00 1.8 1.8 NaN NaN NaN NaN\n", + "100016 2188-05-24 12:00:00 2.0 NaN NaN NaN NaN NaN\n", + "100017 2103-03-11 05:10:00 1.1 NaN 1.1 NaN NaN NaN\n", + "100018 2176-08-29 15:29:00 1.3 NaN NaN NaN NaN NaN\n", + " 2176-08-30 09:23:00 0.9 0.9 NaN NaN NaN NaN\n", + " 2176-08-30 10:19:00 1.0 1.0 NaN NaN NaN NaN\n", + " 2176-08-30 11:29:00 0.9 0.9 NaN NaN NaN NaN\n", + " 2176-08-30 12:40:00 1.1 1.1 NaN NaN NaN NaN\n", + "100020 2142-11-30 21:54:00 1.1 NaN NaN NaN NaN NaN\n", + " 2142-12-03 00:17:00 1.0 NaN NaN NaN NaN NaN\n", + "100024 2170-09-19 10:25:00 1.4 1.4 NaN NaN NaN NaN\n", + " 2170-09-19 16:33:00 2.6 2.6 NaN NaN NaN NaN\n", + " 2170-09-20 02:04:00 3.2 3.2 NaN NaN NaN NaN\n", + "... ... ... ... ... ... ...\n", + "199976 2182-02-14 11:15:00 0.8 NaN 0.8 NaN NaN NaN\n", + " 2182-02-16 03:57:00 0.8 NaN 0.8 NaN NaN NaN\n", + " 2182-02-19 03:59:00 0.8 NaN 0.8 NaN NaN NaN\n", + " 2182-02-20 03:31:00 0.7 NaN 0.7 NaN NaN NaN\n", + " 2182-02-21 04:55:00 0.9 NaN 0.9 NaN NaN NaN\n", + "199979 2182-02-06 09:17:00 1.0 NaN NaN NaN NaN NaN\n", + " 2182-02-06 14:16:00 3.8 3.8 NaN NaN NaN NaN\n", + "199981 2110-09-24 16:34:00 1.1 NaN 1.1 1.1 NaN NaN\n", + " 2110-09-24 20:09:00 1.0 NaN 1.0 1.0 NaN NaN\n", + " 2110-09-25 06:10:00 1.0 NaN 1.0 1.0 NaN NaN\n", + "199987 2175-05-19 16:30:00 2.3 NaN NaN NaN NaN NaN\n", + "199988 2169-01-24 12:48:00 1.0 NaN NaN NaN NaN NaN\n", + " 2169-02-07 01:35:00 1.6 NaN 1.6 NaN NaN NaN\n", + " 2169-02-07 11:18:00 1.0 NaN 1.0 NaN NaN NaN\n", + " 2169-02-07 16:43:00 1.0 NaN 1.0 NaN NaN NaN\n", + " 2169-02-07 22:35:00 1.1 NaN 1.1 NaN NaN NaN\n", + " 2169-02-10 05:33:00 1.4 NaN NaN NaN NaN NaN\n", + "199993 2161-11-12 23:14:00 0.9 NaN 0.9 NaN NaN NaN\n", + " 2161-11-13 03:46:00 0.9 NaN 0.9 NaN NaN NaN\n", + "199994 2188-07-07 21:23:00 1.0 NaN 1.0 NaN NaN NaN\n", + " 2188-07-08 03:09:00 0.7 NaN 0.7 NaN NaN NaN\n", + " 2188-07-08 04:13:00 0.6 NaN 0.6 NaN NaN NaN\n", + " 2188-07-08 06:20:00 0.7 NaN 0.7 NaN NaN NaN\n", + "199998 2119-02-20 10:52:00 1.1 1.1 1.1 1.1 NaN NaN\n", + " 2119-02-20 12:36:00 1.9 1.9 1.9 1.9 NaN NaN\n", + " 2119-02-20 13:33:00 2.0 2.0 2.0 2.0 NaN NaN\n", + " 2119-02-20 13:59:00 2.6 2.6 2.6 2.6 NaN NaN\n", + " 2119-02-20 20:43:00 1.3 1.3 1.3 1.3 NaN NaN\n", + "199999 2136-04-04 20:55:00 1.9 NaN NaN NaN NaN NaN\n", + " 2136-04-06 15:29:00 1.8 NaN NaN NaN NaN NaN\n", + "\n", + "[177451 rows x 6 columns]" + ] + }, + "execution_count": 216, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_cleaned" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df_invalid = df_cleaned.loc[:,df_cleaned.columns.get_level_values('status') == 'unknown']" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df_invalid.columns.set_labels([0]*df_invalid.columns.size,level='status',inplace=True)\n", + "df_invalid.columns.set_levels(['known'],level='status',inplace=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"10\" halign=\"left\">lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"6\" halign=\"left\">known</th>\n", + " <th colspan=\"4\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">nom</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " <th colspan=\"2\" halign=\"left\">mmol/L</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " <th colspan=\"2\" halign=\"left\">no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>50813(mmol/L)</th>\n", + " <th>818</th>\n", + " <th>50813</th>\n", + " <th>225668</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>50813(mmol/L)</th>\n", + " <th>818</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>100001</th>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100003</th>\n", + " <th>2150-04-17 19:12:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-08 10:58:00</th>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-03-31 00:44:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-02 14:10:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100009</th>\n", + " <th>2162-05-17 13:19:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2162-05-17 17:14:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.5</td>\n", + " <td>1.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">100010</th>\n", + " <th>2109-12-10 10:25:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 12:11:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:05:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:58:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100011</th>\n", + " <th>2177-08-29 04:44:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-08-29 06:55:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.3</td>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100012</th>\n", + " <th>2177-03-14 07:38:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-14 11:42:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.5</td>\n", + " <td>2.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 08:05:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.1</td>\n", + " <td>2.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 14:01:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 21:42:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.8</td>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100016</th>\n", + " <th>2188-05-24 12:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100017</th>\n", + " <th>2103-03-11 05:10:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100018</th>\n", + " <th>2176-08-29 15:29:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 09:23:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 10:19:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 11:29:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 12:40:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100020</th>\n", + " <th>2142-11-30 21:54:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2142-12-03 00:17:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100024</th>\n", + " <th>2170-09-19 10:25:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.4</td>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-19 16:33:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-20 02:04:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.2</td>\n", + " <td>3.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199976</th>\n", + " <th>2182-02-14 11:15:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-16 03:57:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-19 03:59:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-20 03:31:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-21 04:55:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199979</th>\n", + " <th>2182-02-06 09:17:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-06 14:16:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.8</td>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">199981</th>\n", + " <th>2110-09-24 16:34:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-24 20:09:00</th>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-25 06:10:00</th>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>199987</th>\n", + " <th>2175-05-19 16:30:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">199988</th>\n", + " <th>2169-01-24 12:48:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 01:35:00</th>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 11:18:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 16:43:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 22:35:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-10 05:33:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199993</th>\n", + " <th>2161-11-12 23:14:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-11-13 03:46:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">199994</th>\n", + " <th>2188-07-07 21:23:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 03:09:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 04:13:00</th>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 06:20:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199998</th>\n", + " <th>2119-02-20 10:52:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 12:36:00</th>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:33:00</th>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:59:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 20:43:00</th>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199999</th>\n", + " <th>2136-04-04 20:55:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 15:29:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>177451 rows × 10 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label lactate \\\n", + "status known \n", + "variable_type qn nom qn \n", + "units no_units no_units mmol/L \n", + "description 818 1531 50813(mmol/L) 818 50813 225668 \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 NaN NaN NaN NaN 1.9 NaN \n", + "100003 2150-04-17 19:12:00 NaN NaN NaN NaN 1.1 1.1 \n", + "100006 2108-04-08 10:58:00 4.5 NaN NaN NaN 4.5 NaN \n", + "100007 2145-03-31 00:44:00 NaN NaN NaN NaN 3.1 NaN \n", + " 2145-04-02 14:10:00 NaN NaN NaN NaN 1.9 NaN \n", + "100009 2162-05-17 13:19:00 NaN NaN NaN NaN 1.1 1.1 \n", + " 2162-05-17 17:14:00 NaN NaN NaN NaN 1.5 1.5 \n", + "100010 2109-12-10 10:25:00 NaN NaN NaN NaN 0.6 NaN \n", + " 2109-12-10 12:11:00 NaN NaN NaN NaN 0.9 NaN \n", + " 2109-12-10 13:05:00 NaN NaN NaN NaN 1.0 NaN \n", + " 2109-12-10 13:58:00 NaN NaN NaN NaN 0.8 NaN \n", + "100011 2177-08-29 04:44:00 NaN NaN NaN NaN 3.8 NaN \n", + " 2177-08-29 06:55:00 NaN NaN NaN NaN 2.3 2.3 \n", + "100012 2177-03-14 07:38:00 NaN NaN NaN NaN 2.3 NaN \n", + " 2177-03-14 11:42:00 NaN NaN NaN NaN 2.5 2.5 \n", + " 2177-03-15 08:05:00 NaN NaN NaN NaN 2.1 2.1 \n", + " 2177-03-15 14:01:00 NaN NaN NaN NaN 2.6 2.6 \n", + " 2177-03-15 21:42:00 NaN NaN NaN NaN 1.8 1.8 \n", + "100016 2188-05-24 12:00:00 NaN NaN NaN NaN 2.0 NaN \n", + "100017 2103-03-11 05:10:00 1.1 NaN NaN NaN 1.1 NaN \n", + "100018 2176-08-29 15:29:00 NaN NaN NaN NaN 1.3 NaN \n", + " 2176-08-30 09:23:00 NaN NaN NaN NaN 0.9 0.9 \n", + " 2176-08-30 10:19:00 NaN NaN NaN NaN 1.0 1.0 \n", + " 2176-08-30 11:29:00 NaN NaN NaN NaN 0.9 0.9 \n", + " 2176-08-30 12:40:00 NaN NaN NaN NaN 1.1 1.1 \n", + "100020 2142-11-30 21:54:00 NaN NaN NaN NaN 1.1 NaN \n", + " 2142-12-03 00:17:00 NaN NaN NaN NaN 1.0 NaN \n", + "100024 2170-09-19 10:25:00 NaN NaN NaN NaN 1.4 1.4 \n", + " 2170-09-19 16:33:00 NaN NaN NaN NaN 2.6 2.6 \n", + " 2170-09-20 02:04:00 NaN NaN NaN NaN 3.2 3.2 \n", + "... ... ... ... ... ... ... \n", + "199976 2182-02-14 11:15:00 0.8 NaN NaN NaN 0.8 NaN \n", + " 2182-02-16 03:57:00 0.8 NaN NaN NaN 0.8 NaN \n", + " 2182-02-19 03:59:00 0.8 NaN NaN NaN 0.8 NaN \n", + " 2182-02-20 03:31:00 0.7 NaN NaN NaN 0.7 NaN \n", + " 2182-02-21 04:55:00 0.9 NaN NaN NaN 0.9 NaN \n", + "199979 2182-02-06 09:17:00 NaN NaN NaN NaN 1.0 NaN \n", + " 2182-02-06 14:16:00 NaN NaN NaN NaN 3.8 3.8 \n", + "199981 2110-09-24 16:34:00 1.1 1.1 NaN NaN 1.1 NaN \n", + " 2110-09-24 20:09:00 1.0 1.0 NaN NaN 1.0 NaN \n", + " 2110-09-25 06:10:00 1.0 1.0 NaN NaN 1.0 NaN \n", + "199987 2175-05-19 16:30:00 NaN NaN NaN NaN 2.3 NaN \n", + "199988 2169-01-24 12:48:00 NaN NaN NaN NaN 1.0 NaN \n", + " 2169-02-07 01:35:00 1.6 NaN NaN NaN 1.6 NaN \n", + " 2169-02-07 11:18:00 1.0 NaN NaN NaN 1.0 NaN \n", + " 2169-02-07 16:43:00 1.0 NaN NaN NaN 1.0 NaN \n", + " 2169-02-07 22:35:00 1.1 NaN NaN NaN 1.1 NaN \n", + " 2169-02-10 05:33:00 NaN NaN NaN NaN 1.4 NaN \n", + "199993 2161-11-12 23:14:00 0.9 NaN NaN NaN 0.9 NaN \n", + " 2161-11-13 03:46:00 0.9 NaN NaN NaN 0.9 NaN \n", + "199994 2188-07-07 21:23:00 1.0 NaN NaN NaN 1.0 NaN \n", + " 2188-07-08 03:09:00 0.7 NaN NaN NaN 0.7 NaN \n", + " 2188-07-08 04:13:00 0.6 NaN NaN NaN 0.6 NaN \n", + " 2188-07-08 06:20:00 0.7 NaN NaN NaN 0.7 NaN \n", + "199998 2119-02-20 10:52:00 1.1 1.1 NaN NaN 1.1 1.1 \n", + " 2119-02-20 12:36:00 1.9 1.9 NaN NaN 1.9 1.9 \n", + " 2119-02-20 13:33:00 2.0 2.0 NaN NaN 2.0 2.0 \n", + " 2119-02-20 13:59:00 2.6 2.6 NaN NaN 2.6 2.6 \n", + " 2119-02-20 20:43:00 1.3 1.3 NaN NaN 1.3 1.3 \n", + "199999 2136-04-04 20:55:00 NaN NaN NaN NaN 1.9 NaN \n", + " 2136-04-06 15:29:00 NaN NaN NaN NaN 1.8 NaN \n", + "\n", + "label \n", + "status unknown \n", + "variable_type qn nom \n", + "units no_units no_units \n", + "description 818 1531 50813(mmol/L) 818 \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 NaN NaN NaN NaN \n", + "100003 2150-04-17 19:12:00 NaN NaN NaN NaN \n", + "100006 2108-04-08 10:58:00 4.5 NaN NaN NaN \n", + "100007 2145-03-31 00:44:00 NaN NaN NaN NaN \n", + " 2145-04-02 14:10:00 NaN NaN NaN NaN \n", + "100009 2162-05-17 13:19:00 NaN NaN NaN NaN \n", + " 2162-05-17 17:14:00 NaN NaN NaN NaN \n", + "100010 2109-12-10 10:25:00 NaN NaN NaN NaN \n", + " 2109-12-10 12:11:00 NaN NaN NaN NaN \n", + " 2109-12-10 13:05:00 NaN NaN NaN NaN \n", + " 2109-12-10 13:58:00 NaN NaN NaN NaN \n", + "100011 2177-08-29 04:44:00 NaN NaN NaN NaN \n", + " 2177-08-29 06:55:00 NaN NaN NaN NaN \n", + "100012 2177-03-14 07:38:00 NaN NaN NaN NaN \n", + " 2177-03-14 11:42:00 NaN NaN NaN NaN \n", + " 2177-03-15 08:05:00 NaN NaN NaN NaN \n", + " 2177-03-15 14:01:00 NaN NaN NaN NaN \n", + " 2177-03-15 21:42:00 NaN NaN NaN NaN \n", + "100016 2188-05-24 12:00:00 NaN NaN NaN NaN \n", + "100017 2103-03-11 05:10:00 1.1 NaN NaN NaN \n", + "100018 2176-08-29 15:29:00 NaN NaN NaN NaN \n", + " 2176-08-30 09:23:00 NaN NaN NaN NaN \n", + " 2176-08-30 10:19:00 NaN NaN NaN NaN \n", + " 2176-08-30 11:29:00 NaN NaN NaN NaN \n", + " 2176-08-30 12:40:00 NaN NaN NaN NaN \n", + "100020 2142-11-30 21:54:00 NaN NaN NaN NaN \n", + " 2142-12-03 00:17:00 NaN NaN NaN NaN \n", + "100024 2170-09-19 10:25:00 NaN NaN NaN NaN \n", + " 2170-09-19 16:33:00 NaN NaN NaN NaN \n", + " 2170-09-20 02:04:00 NaN NaN NaN NaN \n", + "... ... ... ... ... \n", + "199976 2182-02-14 11:15:00 0.8 NaN NaN NaN \n", + " 2182-02-16 03:57:00 0.8 NaN NaN NaN \n", + " 2182-02-19 03:59:00 0.8 NaN NaN NaN \n", + " 2182-02-20 03:31:00 0.7 NaN NaN NaN \n", + " 2182-02-21 04:55:00 0.9 NaN NaN NaN \n", + "199979 2182-02-06 09:17:00 NaN NaN NaN NaN \n", + " 2182-02-06 14:16:00 NaN NaN NaN NaN \n", + "199981 2110-09-24 16:34:00 1.1 1.1 NaN NaN \n", + " 2110-09-24 20:09:00 1.0 1.0 NaN NaN \n", + " 2110-09-25 06:10:00 1.0 1.0 NaN NaN \n", + "199987 2175-05-19 16:30:00 NaN NaN NaN NaN \n", + "199988 2169-01-24 12:48:00 NaN NaN NaN NaN \n", + " 2169-02-07 01:35:00 1.6 NaN NaN NaN \n", + " 2169-02-07 11:18:00 1.0 NaN NaN NaN \n", + " 2169-02-07 16:43:00 1.0 NaN NaN NaN \n", + " 2169-02-07 22:35:00 1.1 NaN NaN NaN \n", + " 2169-02-10 05:33:00 NaN NaN NaN NaN \n", + "199993 2161-11-12 23:14:00 0.9 NaN NaN NaN \n", + " 2161-11-13 03:46:00 0.9 NaN NaN NaN \n", + "199994 2188-07-07 21:23:00 1.0 NaN NaN NaN \n", + " 2188-07-08 03:09:00 0.7 NaN NaN NaN \n", + " 2188-07-08 04:13:00 0.6 NaN NaN NaN \n", + " 2188-07-08 06:20:00 0.7 NaN NaN NaN \n", + "199998 2119-02-20 10:52:00 1.1 1.1 NaN NaN \n", + " 2119-02-20 12:36:00 1.9 1.9 NaN NaN \n", + " 2119-02-20 13:33:00 2.0 2.0 NaN NaN \n", + " 2119-02-20 13:59:00 2.6 2.6 NaN NaN \n", + " 2119-02-20 20:43:00 1.3 1.3 NaN NaN \n", + "199999 2136-04-04 20:55:00 NaN NaN NaN NaN \n", + " 2136-04-06 15:29:00 NaN NaN NaN NaN \n", + "\n", + "[177451 rows x 10 columns]" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_invalid.join(df_cleaned, how='outer')" + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df = utils.open_df('data/mimic_data','transformed/{}'.format(label))\n", + "df_cleaned = pipeline.transform(df)\n", + "utils.data_loss(df,df_cleaned)" + ] + }, + { + "cell_type": "code", + "execution_count": 72, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(113L, 0, '0.0%')" + ] + }, + "execution_count": 72, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Secondary/optional transformation" + ] + }, + { + "cell_type": "code", + "execution_count": 99, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload (transformers)\n", + "pipeline1 = Pipeline([\n", + " ('combine_like_columns',transformers.combine_like_cols()),\n", + " ('quantitative_vales_only',transformers.quantitative_only()),\n", + " ('known_col_only',transformers.known_col_only())\n", + " ])\n", + "\n", + "pipeline2 = Pipeline([\n", + " ('combine_like_columns',transformers.combine_like_cols()),\n", + " ('max_col',transformers.max_col_only()),\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(205349L, 20, '0.0583%')" + ] + }, + "execution_count": 74, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_final = pipeline1.transform(df_cleaned)\n", + "utils.data_loss(df,df_final)" + ] + }, + { + "cell_type": "code", + "execution_count": 75, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(205349L, 20, '0.0583%')" + ] + }, + "execution_count": 75, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_final = pipeline2.transform(df_cleaned)\n", + "utils.data_loss(df,df_final)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Handle Categorical columns\n", + "\n", + "0. Standardize category lists\n", + "1. Make sure ordinal & nominal within category list?\n", + "2. Explode nominal\n", + "3. Ordinal to numeric" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "def make_cat_dict(label,cat_codes):\n", + " df = utils.open_df(hdf5_fname, 'transformed/{}'.format(label))\n", + " mimic_cats = df.iloc[:,0].value_counts().sort_index().index.astype(str).tolist()\n", + " return dict(zip(mimic_cats,cat_codes))" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "category_map={}" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>val_numeric</th>\n", + " <th>val_text</th>\n", + " </tr>\n", + " <tr>\n", + " <th>category_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>1</td>\n", + " <td>No motor response</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>2</td>\n", + " <td>Extension to pain</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>3</td>\n", + " <td>Flexion to pain</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>4</td>\n", + " <td>Withdrawal from pain</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>5</td>\n", + " <td>Localizing pain</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>6</td>\n", + " <td>Obeys commands</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>1</td>\n", + " <td>No eye opening</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>2</td>\n", + " <td>Eye opening to pain</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>3</td>\n", + " <td>Eye opening to verbal command</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>4</td>\n", + " <td>Eyes open spontaneously</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>1</td>\n", + " <td>No verbal response (>2 yrs); no vocal response...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>2</td>\n", + " <td>Incomprehensible sounds</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>3</td>\n", + " <td>Inappropriate words</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>4</td>\n", + " <td>Confused</td>\n", + " </tr>\n", + " <tr>\n", + " <th>14</th>\n", + " <td>5</td>\n", + " <td>Oriented</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " val_numeric val_text\n", + "category_id \n", + "0 1 No motor response \n", + "1 2 Extension to pain\n", + "2 3 Flexion to pain\n", + "3 4 Withdrawal from pain \n", + "4 5 Localizing pain\n", + "5 6 Obeys commands\n", + "6 1 No eye opening\n", + "7 2 Eye opening to pain\n", + "8 3 Eye opening to verbal command\n", + "9 4 Eyes open spontaneously\n", + "10 1 No verbal response (>2 yrs); no vocal response...\n", + "11 2 Incomprehensible sounds\n", + "12 3 Inappropriate words\n", + "13 4 Confused\n", + "14 5 Oriented" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_dict.tables.categories" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "label = data_dict.labels.GLASGOW_COMA_SCALE_MOTOR\n", + "category_map[label] = make_cat_dict(label,range(0,6))\n", + "label = data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING\n", + "category_map[label] = make_cat_dict(label,range(6,10))\n", + "label = data_dict.labels.GLASGOW_COMA_SCALE_VERBAL\n", + "category_map[label] = make_cat_dict(label,[10] + range(10,15))" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'glasgow coma scale eye opening': {'1 No Response': 6,\n", + " '2 To pain': 7,\n", + " '3 To speech': 8,\n", + " '4 Spontaneously': 9},\n", + " 'glasgow coma scale motor': {'1 No Response': 0,\n", + " '2 Abnorm extensn': 1,\n", + " '3 Abnorm flexion': 2,\n", + " '4 Flex-withdraws': 3,\n", + " '5 Localizes Pain': 4,\n", + " '6 Obeys Commands': 5},\n", + " 'glasgow coma scale verbal': {'1 No Response': 10,\n", + " '1.0 ET/Trach': 10,\n", + " '2 Incomp sounds': 11,\n", + " '3 Inapprop words': 12,\n", + " '4 Confused': 13,\n", + " '5 Oriented': 14}}" + ] + }, + "execution_count": 63, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "category_map" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<module 'transformers' from 'transformers.pyc'>" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "reload(utils)\n", + "reload(transformers)" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>glasgow coma scale verbal</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>723</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>1.0 ET/Trach</th>\n", + " <td>444357</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5 Oriented</th>\n", + " <td>379668</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4 Confused</th>\n", + " <td>82434</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1 No Response</th>\n", + " <td>20836</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2 Incomp sounds</th>\n", + " <td>18007</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3 Inapprop words</th>\n", + " <td>5611</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale verbal\n", + "status known\n", + "variable_type ord\n", + "units no_units\n", + "description 723\n", + "1.0 ET/Trach 444357\n", + "5 Oriented 379668\n", + "4 Confused 82434\n", + "1 No Response 20836\n", + "2 Incomp sounds 18007\n", + "3 Inapprop words 5611" + ] + }, + "execution_count": 58, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_gcs = utils.open_df(hdf5_fname, 'transformed/{}'.format(data_dict.labels.GLASGOW_COMA_SCALE_VERBAL))\n", + "df_gcs = standard_pipeline.transform(df_gcs)\n", + "df_gcs.apply(lambda x: x.value_counts())" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>glasgow coma scale verbal</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>723</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>465193</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5 Oriented</th>\n", + " <td>379668</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>82434</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>18007</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>5611</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale verbal\n", + "status known\n", + "variable_type ord\n", + "units no_units\n", + "description 723\n", + "1 465193\n", + "5 Oriented 379668\n", + "4 82434\n", + "2 18007\n", + "3 5611" + ] + }, + "execution_count": 59, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "transformer = transformers.standardize_categories(data_dict,category_map,use_numeric=True)\n", + "df_gcs = transformer.transform(df_gcs)\n", + "df_gcs.apply(lambda x: x.value_counts())" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">glasgow coma scale verbal</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " <th>unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " <th>nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>723</th>\n", + " <th>723</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>465193.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>18007.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>5611.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>82434.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5 Oriented</th>\n", + " <td>NaN</td>\n", + " <td>379668.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale verbal \n", + "status known unknown\n", + "variable_type ord nom\n", + "units no_units no_units\n", + "description 723 723\n", + "1 465193.0 NaN\n", + "2 18007.0 NaN\n", + "3 5611.0 NaN\n", + "4 82434.0 NaN\n", + "5 Oriented NaN 379668.0" + ] + }, + "execution_count": 60, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "transformer2 = transformers.split_bad_categories(data_dict,use_numeric=True)\n", + "transformer2.transform(df_gcs).apply(lambda x: x.value_counts())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Unified pipeline" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import icu_data_defs\n", + "from sklearn.pipeline import Pipeline\n", + "import transformers\n", + "from units import MedicalUreg\n", + "from constants import variable_type\n", + "import utils\n", + "import mimic\n", + "import warnings\n", + "warnings.filterwarnings('ignore')" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(transformers)\n", + "reload(utils)\n", + "reload(mimic)\n", + "hdf5_fname = 'data/mimic_data'\n", + "\n", + "#get all labels\n", + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n", + "ureg = MedicalUreg('config/medical_units.txt')\n", + "\n", + "agg_func = lambda x:x.iloc[0]\n", + "var_types_to_keep = [variable_type.QUANTITATIVE,variable_type.ORDINAL]\n", + "category_map = {\n", + " data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING: {\n", + " '1 No Response': 6,\n", + " '2 To pain': 7,\n", + " '3 To speech': 8,\n", + " '4 Spontaneously': 9\n", + " },\n", + " data_dict.labels.GLASGOW_COMA_SCALE_MOTOR: {\n", + " '1 No Response': 0,\n", + " '2 Abnorm extensn': 1,\n", + " '3 Abnorm flexion': 2,\n", + " '4 Flex-withdraws': 3,\n", + " '5 Localizes Pain': 4,\n", + " '6 Obeys Commands': 5\n", + " },\n", + " data_dict.labels.GLASGOW_COMA_SCALE_VERBAL: {\n", + " '1 No Response': 10,\n", + " '1.0 ET/Trach': 10,\n", + " '2 Incomp sounds': 11,\n", + " '3 Inapprop words': 12,\n", + " '4 Confused': 13,\n", + " '5 Oriented':14\n", + " }\n", + "}\n", + "\n", + "mimic_transform = Pipeline([\n", + " ('clean',mimic.clean_extract()),\n", + " ('unstack',mimic.unstacker()),\n", + " ('add_level',transformers.add_level(None,'label',axis=1)),\n", + "])\n", + "\n", + "standard_pipeline = Pipeline([\n", + " ('drop_small_columns',transformers.remove_small_columns(threshold=5)),\n", + " ('aggregate_same_datetime',transformers.same_index_aggregator(agg_func)),\n", + " ('split_dtype',transformers.split_dtype()),\n", + " ('standardize_columns',transformers.standardize_columns(data_dict,ureg)),\n", + " ('standardize_categories',transformers.standardize_categories(data_dict,category_map)),\n", + " ('split_bad_categories',transformers.split_bad_categories(data_dict))\n", + " ])\n", + "\n", + "cleaning_pipeline = Pipeline([\n", + " ('drop_small_columns',transformers.remove_small_columns(threshold=50)),\n", + " ('combine_like_columns',transformers.combine_like_cols()),\n", + " ('quantitative_only',transformers.filter_var_type(var_types_to_keep)),\n", + " ('known_col_only',transformers.known_col_only()),\n", + "# ('max_col',transformers.max_col_only()) \n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>817373.000000</td>\n", + " <td>817373</td>\n", + " <td>771272.000000</td>\n", + " <td>817373</td>\n", + " <td>817373.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>NaN</td>\n", + " <td>536890</td>\n", + " <td>446614.000000</td>\n", + " <td>6</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>NaN</td>\n", + " <td>2159-09-30 01:00:00</td>\n", + " <td>99.999996</td>\n", + " <td>mL/hour</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>NaN</td>\n", + " <td>9</td>\n", + " <td>25385.000000</td>\n", + " <td>719922</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>first</th>\n", + " <td>NaN</td>\n", + " <td>2100-06-08 04:23:00</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>last</th>\n", + " <td>NaN</td>\n", + " <td>2209-08-07 14:27:00</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>150437.603989</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>222346.358593</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>28720.645234</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>23242.543767</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>100001.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>4647.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>125824.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>225158.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>150715.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>225158.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>175466.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>225158.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>199984.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>225158.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units \\\n", + "count 817373.000000 817373 771272.000000 817373 \n", + "unique NaN 536890 446614.000000 6 \n", + "top NaN 2159-09-30 01:00:00 99.999996 mL/hour \n", + "freq NaN 9 25385.000000 719922 \n", + "first NaN 2100-06-08 04:23:00 NaN NaN \n", + "last NaN 2209-08-07 14:27:00 NaN NaN \n", + "mean 150437.603989 NaN NaN NaN \n", + "std 28720.645234 NaN NaN NaN \n", + "min 100001.000000 NaN NaN NaN \n", + "25% 125824.000000 NaN NaN NaN \n", + "50% 150715.000000 NaN NaN NaN \n", + "75% 175466.000000 NaN NaN NaN \n", + "max 199984.000000 NaN NaN NaN \n", + "\n", + " itemid \n", + "count 817373.000000 \n", + "unique NaN \n", + "top NaN \n", + "freq NaN \n", + "first NaN \n", + "last NaN \n", + "mean 222346.358593 \n", + "std 23242.543767 \n", + "min 4647.000000 \n", + "25% 225158.000000 \n", + "50% 225158.000000 \n", + "75% 225158.000000 \n", + "max 225158.000000 " + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "label = 'normal saline'\n", + "df = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n", + "df.describe(include='all')" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": { + "collapsed": false, + "scrolled": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"17\" halign=\"left\">normal saline</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL/hour</th>\n", + " <th>mL</th>\n", + " <th>ml</th>\n", + " <th>mL/hour</th>\n", + " <th>no_units</th>\n", + " <th>ml</th>\n", + " <th>mL</th>\n", + " <th>ml</th>\n", + " <th>mL/min</th>\n", + " <th>L</th>\n", + " <th colspan=\"2\" halign=\"left\">ml</th>\n", + " <th>no_units</th>\n", + " <th>ml</th>\n", + " <th>mL/hour</th>\n", + " <th>ml</th>\n", + " <th>mL/hour</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>225158</th>\n", + " <th>225158</th>\n", + " <th>30190</th>\n", + " <th>30190</th>\n", + " <th>30190</th>\n", + " <th>225158</th>\n", + " <th>30190</th>\n", + " <th>4647</th>\n", + " <th>225158</th>\n", + " <th>225158</th>\n", + " <th>6190</th>\n", + " <th>44053</th>\n", + " <th>44053</th>\n", + " <th>44440</th>\n", + " <th>44440</th>\n", + " <th>41913</th>\n", + " <th>41913</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>719400.000000</td>\n", + " <td>39402.0</td>\n", + " <td>5167.0</td>\n", + " <td>259.0</td>\n", + " <td>160.0</td>\n", + " <td>6730.000000</td>\n", + " <td>50.0</td>\n", + " <td>8</td>\n", + " <td>80.0</td>\n", + " <td>1.0</td>\n", + " <td>1</td>\n", + " <td>3.0</td>\n", + " <td>2.0</td>\n", + " <td>5.0</td>\n", + " <td>1.0</td>\n", + " <td>2.0</td>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>443511.000000</td>\n", + " <td>147.0</td>\n", + " <td>243.0</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>4233.000000</td>\n", + " <td>1.0</td>\n", + " <td>1</td>\n", + " <td>6.0</td>\n", + " <td>1.0</td>\n", + " <td>1</td>\n", + " <td>2.0</td>\n", + " <td>1.0</td>\n", + " <td>2.0</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>99.999996</td>\n", + " <td>500.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>49.999999</td>\n", + " <td>0.0</td>\n", + " <td>given</td>\n", + " <td>100.0</td>\n", + " <td>1000.0</td>\n", + " <td>given</td>\n", + " <td>17.0</td>\n", + " <td>0.0</td>\n", + " <td>37.0</td>\n", + " <td>0.0</td>\n", + " <td>20.0</td>\n", + " <td>0.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>25193.000000</td>\n", + " <td>11589.0</td>\n", + " <td>651.0</td>\n", + " <td>259.0</td>\n", + " <td>160.0</td>\n", + " <td>352.000000</td>\n", + " <td>50.0</td>\n", + " <td>8</td>\n", + " <td>60.0</td>\n", + " <td>1.0</td>\n", + " <td>1</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>3.0</td>\n", + " <td>1.0</td>\n", + " <td>2.0</td>\n", + " <td>1.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label normal saline \\\n", + "units mL/hour mL ml mL/hour no_units ml \n", + "description 225158 225158 30190 30190 30190 225158 \n", + "count 719400.000000 39402.0 5167.0 259.0 160.0 6730.000000 \n", + "unique 443511.000000 147.0 243.0 1.0 1.0 4233.000000 \n", + "top 99.999996 500.0 1.0 0.0 0.0 49.999999 \n", + "freq 25193.000000 11589.0 651.0 259.0 160.0 352.000000 \n", + "\n", + "label \\\n", + "units mL ml mL/min L ml no_units ml \n", + "description 30190 4647 225158 225158 6190 44053 44053 44440 \n", + "count 50.0 8 80.0 1.0 1 3.0 2.0 5.0 \n", + "unique 1.0 1 6.0 1.0 1 2.0 1.0 2.0 \n", + "top 0.0 given 100.0 1000.0 given 17.0 0.0 37.0 \n", + "freq 50.0 8 60.0 1.0 1 2.0 2.0 3.0 \n", + "\n", + "label \n", + "units mL/hour ml mL/hour \n", + "description 44440 41913 41913 \n", + "count 1.0 2.0 1.0 \n", + "unique 1.0 1.0 1.0 \n", + "top 0.0 20.0 0.0 \n", + "freq 1.0 2.0 1.0 " + ] + }, + "execution_count": 27, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mimic_transform.set_params(add_level__level_val=label)\n", + "df_tr = mimic_transform.transform(df)\n", + "df_tr.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "((770238, 17), (504923, 9), 265320L, 4, '0.0202% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"9\" halign=\"left\">normal saline</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " <th>unknown</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th>nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL/hr</th>\n", + " <th colspan=\"2\" halign=\"left\">mL</th>\n", + " <th>mL/hr</th>\n", + " <th>no_units</th>\n", + " <th colspan=\"2\" halign=\"left\">mL</th>\n", + " <th>mL/min</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>225158(mL/hour)</th>\n", + " <th>225158</th>\n", + " <th>30190(ml)</th>\n", + " <th>30190(mL/hour)</th>\n", + " <th>30190</th>\n", + " <th>225158(ml)</th>\n", + " <th>30190</th>\n", + " <th>225158</th>\n", + " <th>4647(ml)</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>456226.000000</td>\n", + " <td>39261.000000</td>\n", + " <td>5068.000000</td>\n", + " <td>258.0</td>\n", + " <td>157.0</td>\n", + " <td>4844.000000</td>\n", + " <td>50.0</td>\n", + " <td>80.000000</td>\n", + " <td>8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>given</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>75.669716</td>\n", + " <td>471.560439</td>\n", + " <td>4.255024</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>128.094818</td>\n", + " <td>0.0</td>\n", + " <td>103.312500</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>217.566524</td>\n", + " <td>372.084861</td>\n", + " <td>8.418981</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>260.186534</td>\n", + " <td>0.0</td>\n", + " <td>55.885358</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-906.000000</td>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.000000</td>\n", + " <td>0.0</td>\n", + " <td>0.500000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>6.000000</td>\n", + " <td>200.000000</td>\n", + " <td>0.850000</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>9.310294</td>\n", + " <td>0.0</td>\n", + " <td>100.000000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>15.000000</td>\n", + " <td>500.000000</td>\n", + " <td>1.100000</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>25.000000</td>\n", + " <td>0.0</td>\n", + " <td>100.000000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>62.255889</td>\n", + " <td>500.000000</td>\n", + " <td>2.400000</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>100.000001</td>\n", + " <td>0.0</td>\n", + " <td>100.000000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>51947.999400</td>\n", + " <td>11000.000000</td>\n", + " <td>117.000000</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>5000.000160</td>\n", + " <td>0.0</td>\n", + " <td>300.000000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label normal saline \\\n", + "status known \n", + "variable_type qn \n", + "units mL/hr mL mL/hr \n", + "description 225158(mL/hour) 225158 30190(ml) 30190(mL/hour) \n", + "count 456226.000000 39261.000000 5068.000000 258.0 \n", + "unique NaN NaN NaN NaN \n", + "top NaN NaN NaN NaN \n", + "freq NaN NaN NaN NaN \n", + "mean 75.669716 471.560439 4.255024 0.0 \n", + "std 217.566524 372.084861 8.418981 0.0 \n", + "min -906.000000 0.000000 0.000000 0.0 \n", + "25% 6.000000 200.000000 0.850000 0.0 \n", + "50% 15.000000 500.000000 1.100000 0.0 \n", + "75% 62.255889 500.000000 2.400000 0.0 \n", + "max 51947.999400 11000.000000 117.000000 0.0 \n", + "\n", + "label \n", + "status unknown known unknown \n", + "variable_type qn qn qn nom \n", + "units no_units mL mL/min no_units \n", + "description 30190 225158(ml) 30190 225158 4647(ml) \n", + "count 157.0 4844.000000 50.0 80.000000 8 \n", + "unique NaN NaN NaN NaN 1 \n", + "top NaN NaN NaN NaN given \n", + "freq NaN NaN NaN NaN 8 \n", + "mean 0.0 128.094818 0.0 103.312500 NaN \n", + "std 0.0 260.186534 0.0 55.885358 NaN \n", + "min 0.0 0.000000 0.0 0.500000 NaN \n", + "25% 0.0 9.310294 0.0 100.000000 NaN \n", + "50% 0.0 25.000000 0.0 100.000000 NaN \n", + "75% 0.0 100.000001 0.0 100.000000 NaN \n", + "max 0.0 5000.000160 0.0 300.000000 NaN " + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_cln1 = standard_pipeline.transform(df_tr)\n", + "print utils.data_loss(df_tr,df_cln1)\n", + "df_cln1.describe(include='all')" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "this step: ((504923, 9), (504874, 2), 295L, 1, '0.0051% records')\n", + "overall: ((770238, 17), (504874, 2), 265615L, 5, '0.0253% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">normal saline</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>49173.000000</td>\n", + " <td>456484.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>389.563178</td>\n", + " <td>75.626948</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>380.287765</td>\n", + " <td>217.512467</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>-906.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>100.000000</td>\n", + " <td>6.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>250.000000</td>\n", + " <td>15.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>500.000000</td>\n", + " <td>62.204886</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>11000.000000</td>\n", + " <td>51947.999400</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label normal saline \n", + "status known \n", + "variable_type qn \n", + "units mL mL/hr\n", + "count 49173.000000 456484.000000\n", + "mean 389.563178 75.626948\n", + "std 380.287765 217.512467\n", + "min 0.000000 -906.000000\n", + "25% 100.000000 6.000000\n", + "50% 250.000000 15.000000\n", + "75% 500.000000 62.204886\n", + "max 11000.000000 51947.999400" + ] + }, + "execution_count": 36, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_cln2 = cleaning_pipeline.transform(df_cln1)\n", + "print 'this step:',utils.data_loss(df_cln1,df_cln2)\n", + "print 'overall:',utils.data_loss(df_tr,df_cln2)\n", + "df_cln2.describe(include='all')" + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "array([[<matplotlib.axes._subplots.AxesSubplot object at 0x0000000043A236D8>,\n", + " <matplotlib.axes._subplots.AxesSubplot object at 0x0000000029BE0C18>]], dtype=object)" + ] + }, + "execution_count": 42, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgAAAAFeCAYAAADzFKfgAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAIABJREFUeJzt3X9clfX9//Hn+QGiHPBHYbd0DoyJpTMT0Fn+GE1Z2Nxn\nlVDg1Jrmr1Xb1HlDWop+0sA2P61ltvZpy88HW2K/1ubWKtJwMpdKN1xSWl/b1KwZoSUcCQ6c9/cP\nP5yJggeBA9r7cb/dvN0813W9r9f7fTjviyfnXOe6HMYYIwAAYBVnV3cAAAB0PgIAAAAWIgAAAGAh\nAgAAABYiAAAAYCECAAAAFrpoA8CaNWtUUlKitWvXavr06V3dnSauvPJKffrpp+3ezwsvvKB58+ZJ\nku677z7t2LGjXX3atWvXObeZPn261q5dqyNHjmjEiBFtrtWRvvGNb+h3v/tdl7TfuXOnrrzyyjbX\nbkv7tWvXauXKlefc12uvvaZHH320zf26UDGnz79PzOnzcyHN6UZPPfWUnnrqKeXk5OjJJ588rz60\n91hwUQaAPXv26MCBAxozZowiIiIUGRnZ1V1qwuFwdPg+V65cqWuvvbbN7bt3767u3bsH3aZHjx6S\nQjOGtmhNv0PVPiIiol2129u+pX1NmDBBpaWl2rdvX4fs+0LAnD5/zOnzdyHN6UZbtmzRxIkT29SH\n9h4L3G1q1cUeeeSRwF8IQ4cOVeO1jL7xjW/olltu0Y4dO/TRRx9p0qRJWrx4sSSpsLBQGzZskMvl\n0iWXXKJly5YpNjZWOTk5+vTTT/XBBx8oJSVFn3zyibp166a33npLlZWVSktLU58+fbRlyxZVVlZq\n5cqV+trXvqZ//vOf+s///E+dPHlSH3/8sa666io99NBDCg8PV0vXVvrFL36h1157TWFhYerVq5fy\n8/N16aWX6tlnn9WmTZtUX1+vTz/9VHPmzFFmZmaTttOnT9f06dM1dOhQ3XHHHfr617+uPXv26MSJ\nE/rhD3+oG2+8UZL0y1/+Uq+88oqMMerfv79yc3MVExOj6667TgkJCed8XpOSkjRs2LAmyw4cOKA5\nc+YoJydHV111VYu16+vrlZ+frx07dsjlcmn48OFasmSJnnvuOb311lv66U9/qvr6en3ta1/TT37y\nE91yyy168803lZeXp8WLF+uhhx7SgAED9N5778nn82nZsmUaNWqURo0apSFDhpyz3y+88IJefvll\n/fKXvzzr8entH374YW3evFl9+vRRYmKi9u7dq4KCAuXk5CgyMlLvvvuu/vWvf+mKK67QQw89pK98\n5SsaO3bsOWuf/rP55je/2eTx2LFjA+1zcnJa9bpqyZl9SU9P19q1a7V27dqg/bsYMKeZ06ezYU5L\nUlVVlbxery677DJJ0ptvvqmXX35ZlZWVGjRokP7rv/5LERERGjZsmCZMmKD9+/dr1apVHXcsMBeZ\nEydOmGuuucb4fL6z1l1//fVm9erVxhhj/vWvf5mrr77afPDBB+avf/2r+eY3v2mOHz9ujDHm+eef\nNzfeeKMxxpglS5aY733ve4F9LFmyxNx2222moaHBVFRUmMGDB5sNGzYYY4z5n//5HzNz5kxjjDGr\nV682v//9740xxvh8PvPtb3/bvPLKK8YYYwYPHhyo1eijjz4ySUlJpq6uzhhjzJNPPmmKioqM1+s1\nt912m/n000+NMcaUlZWZESNGBPo5d+5cY4wx06ZNMy+//LL54IMPzODBg83rr79ujDHm5ZdfNtdf\nf70xxpgXXnjBLFiwwDQ0NBhjjCksLDSzZ88+7+f4gw8+MCNGjDDvvvuuSU1NNX/7298Cy1uq/fDD\nD5t77rknUDsnJ8fk5uaaI0eOmDFjxhhjjHnjjTfM2LFjzaJFi4wxxjz44IPmiSeeMG+88YYZOnSo\n2bdvnzHGmN/85jdm2rRpre7v6c9Tc48b+zp58mRz8uRJU19fb2bPnm2mT59ujDn1M8/KyjI+n8/4\nfD5z8803m+eff77V9Rt/Ni09bqzRmtfVI488Yu6///6gNaurq83w4cNNbW1tq/t5oWJOM6fPZMuc\n/sMf/mDWrVsX2N+tt95qamtrTUNDg7n55pvNiy++aIw59fprfG2eqT3HgovuI4CDBw+qb9++crub\nf/NiwoQJkqTLLrtMl1xyiT777DNt375dkyZNUq9evSRJN998sz7++GMdOXJEkpSYmNhkH9dff72c\nTqcuvfRSde/eXePGjZMkffnLX9Znn30mSVq8eLF69+6tJ554QsuXL1dFRYW8Xm+L/b7ssst01VVX\n6eabb9bq1as1ePBgTZgwQT169NAvf/lLbd26VQ8//LAee+wx1dTUnPM5CAsL09e//nVJ0pAhQwJ9\nev3117Vnzx7dcsstuummm7RhwwYdPHjwnPtqSV1dnW6//XZdddVVTVJsS7X/8pe/KCsrS07nqZfU\n9OnTtW3bNvXr10+XXXaZ3nrrLf3lL3/R3LlztXPnTkmnPr9qTNj9+vXT4MGDz9pvR3njjTeUmpqq\n7t27y+Vy6dZbb22yfty4cXK73XK73UpISOjw+lLrXletFRkZKY/HE3gNX8yY08zptvgizOmioqLA\n61s69VoPDw+X0+lUQkKCjh07FliXlJTU7D7acyy46AKA0+lUQ0NDi+sjIiKaPDbGyO/3n7Wd3+9X\nfX29JJ31eWN4eHiTx80dmBYsWKBNmzapf//++t73vhf0LS2Hw6GCggLl5+erd+/eysvL0wMPPKCj\nR4/qpptu0kcffaTk5GT96Ec/Oud+pFMT9vT9mv97e9Lv92v27Nn63e9+p9/97nd67rnn9NRTTwXd\nX0seffRRvf3223r11VdbVft0DQ0Ngef3m9/8poqLi1VSUqK0tDT169dPf/rTn9S9e3cNGDBAktSt\nW7dm99saZ3626fP5ztqmW7duTfZ5+jikpq+bttQ/ffvm6kute12dj4aGBrlcrnbt40LAnGZOn8mG\nOe3z+XTw4MEmH+O09LOQFDiXozltPRZcdAFgwIABqqysVF1dXavbjBs3Ti+99FIgTT333HPq3bu3\nYmNj29yPkpIS3XXXXZo0aZKMMdqzZ885D2L79u3T5MmTFR8frzlz5uiOO+7Qvn379NZbb6lPnz6a\nP3++xowZo61bt0rSOV+sLa0bO3asnnnmGVVXV0uSfv7znys7O7tN4wsLC9OIESO0atUq5ebmqrKy\nMmjtp59+WvX19fL7/frtb3+rMWPGSJImTpyozZs3y+/369JLL9V1112nn/70p0pLS2tT387Uu3dv\nvfvuu6qrq1N9fb22bNly1jYpKSl66aWXVFVVJb/frxdffLFDaktSnz59tHfvXknSoUOHtH///nbt\nrzUHqurqatXW1uryyy9vV60LAXOaOX0mG+b0jh07gp4j0BrtORZcdCcBRkVFKTk5WW+88Ubg7ZZG\nZ6bGxsfXXXedbr/9dt1+++2STr24Hn/88VbVa+nM2QULFuiuu+5Sr1691L17d40aNUqHDh1qsc2V\nV16pSZMm6ZZbblGPHj3UvXt33XfffYqLi9Nzzz2nG264QZGRkRo2bJj69Olz1tt8p++zpT5lZGTo\n448/1m233San06nLL79ceXl5Z2130003adWqVRo6dGjQcY8aNUrf+ta3dO+992rZsmUt1v7+97+v\nBx98UDfddJMaGhp09dVXa+nSpZKk+Ph4ORyOwBnPY8eO1WOPPabU1NQW6zdnzpw5ysrK0vXXX99k\n+dixYzVq1CilpaWpb9+++trXvnbWhB01apRmzJihrKwsRUREqF+/fudVe+/evbrvvvua/frR/Pnz\ntWTJEr3++uu64oorNGrUqKD7O9cZ2Zs2bdILL7wQeDx48GA9/fTTTbbZvn27rr/++rP+6rkYMaeZ\n0zbO6cGDB2vy5Mmt6uu59t2uY8F5nzVwAXjzzTfNnDlzurobF62HHnrIvPPOO13djfO2adMm8+qr\nr3bIvv785z8HThhqrTNPQupKM2bMMPv37+/qbnQY5nT7MKcv/jndVu05FgT9CMAYo9zcXGVmZmrG\njBk6fPhwk/VbtmxRenq6MjMz9cwzz7SqTV5engoLCwOPN23apClTpigzM1Ovv/560NAyYsQIXXHF\nFdq+fXtrMg7O0L9//3ZdDKOruN3us/5S6CxHjx5VVlZWl9Q+U1FRkUaOHBn0K2Dn0pHz+tChQ5o6\ndaqmTZumFStWBPaxfv163XrrrbrtttsCFyupra3VD37wA333u9/V3Llzdfz4cUnM6fZiTp+/C2lO\nt1W7jwXBEsIrr7xilixZYow59XWW+fPnB9b5fD6TmppqqqqqTF1dnZkyZYqprKxssU1lZaW58847\nTWpqqtm4caMxxpiKigozefJk4/P5TFVVlZk8eXLgazUAQqMj5/W8efPMrl27jDHGLFu2zLz66qvm\n0KFDZsqUKYF9ZmZmmv3795snn3zSPPLII8YYY/74xz+alStXdsp4AZwt6DsApaWlgc/lhg8fHjgx\nQjp1QYnY2Fh5PB6FhYUpOTlZO3fuPKtNeXm5JOnkyZO655579B//8R+Bffz9739XUlKS3G63PB6P\n4uLi2n3CBYBz68h5XV5eruTkZEnS+PHjtWPHDvXr109PPPFEYJ8NDQ3q1q2bSktLNX78+CbbAuga\nQQNAdXW1oqKiAo/dbnfg6yFnruvRo0fgykanL3e5XPL7/frSl76kq6+++pz7b9wHgNDpqHnd0NDQ\n5AznyMhIVVVVyeVyBb6jv3r1ag0ZMkSxsbGqrq6Wx+MJbNt4djuAzhc0AHg8niYXw/D7/YELQ3g8\nniYT2Ov1qmfPnuds09z+z9xHdHT0OftkzuP7nADO1lHz2uVyNZnbp8/furo6LVq0SDU1NcrNzT2r\n7pmBoiXMdyA0gn4NMDExUVu3blVaWprKysqanGwQHx+vgwcP6sSJE4qIiNDu3bs1a9YsSWqxzZmu\nvvpq/fznP1ddXZ1qa2v1/vvva9CgQefsk8PhUEVF171LEBMT1aX1L4Q+2F7/QuhDTEzwX54t6ch5\nPWTIEO3atUsjR47Utm3bNHr0aEmnvkp17bXX6s4772xSt7i4WMOGDVNxcXHgo4Nz6ez53tk/1y9y\nvS/y2Dq7Xnvme0uCBoDU1FSVlJQEbmSRl5enzZs3q6amRhkZGcrJydHMmTNljFF6err69u3bbJuW\nXHrppZo+fbqmTp0qY4wWLlx41tWVAHSsjpzX2dnZWrp0qXw+n+Lj45WWlqaioiLt3r1bPp9PxcXF\ncjgcWrRokbKyspSdna2pU6cqPDxca9as6bLnALCdw1yk76919V9e/PVpd/0LoQ+h+IvgQvVF/avu\ni17vizy2zq4Xivl+0V0KGAAAtB8BAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAA\nCxEAAACwEAEAAAALEQAAALAQAQAAAAsFvRsgAHzRPfviS3r7/X9JkrpFhKn2c1+r245JHKQJXx8b\nqq4BIUMAAGC9f35YqX/Wxp56UHt+bfsd+rDjOwR0Aj4CAADAQgQAAAAsRAAAAMBCBAAAACxEAAAA\nwEIEAAAALEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIX5b0AMmf/RGHde7VrHyc/O6pHV98n\nl8vVQb0CAODicVEGgEpfb0VED2rXPj7318oY00E9AgDg4sJHAAAAWIgAAACAhQgAAABYiAAAAICF\nCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgA\nAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAA\nWIgAAACAhdzBNjDGaPny5dq/f7/Cw8O1atUqDRgwILB+y5YtWrdundxut6ZMmaKMjIwW2xw6dEhL\nliyR0+nUoEGDlJubK0n6zW9+o82bN8vlcmnu3LmaOHFi6EYMAACCvwNQVFSkuro6bdy4UYsWLVJe\nXl5gXX19vfLz87V+/XoVFBSosLBQx44da7FNXl6eFi5cqA0bNsjv96uoqEhVVVUqKCjQM888o1//\n+td64IEHQjdaAAAgqRUBoLS0VOPGjZMkDR8+XHv37g2sO3DggGJjY+XxeBQWFqbk5GTt3LnzrDbl\n5eWSpPLyciUnJ0uSxo8frx07dqh79+7q37+/vF6vTp48KaeTTyUAAAi1oB8BVFdXKyoq6t8N3G75\n/X45nc6z1vXo0UNVVVXyer1NlrtcLjU0NMgYE1gWGRmpqqoqSdJll12mG2+8UcYYzZkzp0MGBgAA\nWhY0AHg8Hnm93sDjxl/+jeuqq6sD67xer3r27NlsG5fL1eSve6/Xq+joaG3btk2ffPKJtm7dKmOM\nZs2apcTERA0bNqxDBtgSp9OhmJgoud1Bn4JmxcREBd8oxLq6D7bXv1D6AABtEfS3X2JiorZu3aq0\ntDSVlZUpISEhsC4+Pl4HDx7UiRMnFBERod27d2vWrFmS1GybIUOGaNeuXRo5cqS2bdum0aNHKzo6\nWhEREQoLC5MkRUVFBd4ZCCW/36iioqpNASAmJkoVFaHv44XcB9vrXwh9IHwAaI+gv/1SU1NVUlKi\nzMxMSadO5Nu8ebNqamqUkZGhnJwczZw5U8YYpaenq2/fvs22kaTs7GwtXbpUPp9P8fHxSktLk8Ph\n0I4dO3TrrbfK6XQqKSlJ1113XQiHDAAAggYAh8OhFStWNFk2cODAwP9TUlKUkpIStI0kxcXFqaCg\n4Kzl99xzj+65557W9hkAALQTp9wDAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGCh\ntl0HF8BFrTNu8y1Jx44dU1ZWlv7whz8oPDxc0qkbgcXFxUmSRowYoQULFnTq2AGcQgAALHT6Lbv3\n7NmjvLw8rVu3TtK/b/P9/PPPq1u3bsrKytKECRNUWlrabJvG23wnJycrNzdXRUVFmjhxorZv3641\na9aosrIyUPfQoUMaOnSoHnvssa4aOoD/w0cAgIVCfZtv6dRdQNevX6+ePXsG9r13714dPXpUM2bM\n0Ny5c/WPf/yjU8YL4Gy8AwBYqDNu833ttddKUpP1ffv21dy5c3XDDTeotLRUixcv1rPPPhuycQJo\nGQEAsFCob/N9OofDEfj/V7/6VblcLklSUlKSKioqOnZgAFqNAABYKNS3+T7d6e8ArF27Vr169dKd\nd96pffv26fLLL29Vf0N96+Pu3cOkz9rWNjKyW7v719m3du7Mel/ksXVFvY5EAAAsFOrbfJ/u9HcA\n5syZo8WLF6u4uFhutzuwj2AqKqo6Ytgtqqnxtbmt11vbrv7FxESFfHxdVe+LPLbOrheKoEEAACzU\nGbf5bvTaa68F/h8dHa3HH3+8jb0G0JH4FgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAh\nAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIA\nAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAA\nFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYi\nAAAAYCF3sA2MMVq+fLn279+v8PBwrVq1SgMGDAis37Jli9atWye3260pU6YoIyOjxTaHDh3SkiVL\n5HQ6NWjQIOXm5kqSiouLtW7dOknS0KFDtWzZshANFwAASK14B6CoqEh1dXXauHGjFi1apLy8vMC6\n+vp65efna/369SooKFBhYaGOHTvWYpu8vDwtXLhQGzZskN/vV1FRkbxer372s5/p8ccfV2Fhofr3\n76/jx4+HbsQAACD4OwClpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8cjSUpOTtbOnTtVVlbWpE15\nebkkqby8XMnJyZKk8ePHq6SkRBEREUpISFB+fr4OHz6sjIwM9e7du2NHCQAAmggaAKqrqxUVFfXv\nBm63/H6/nE7nWet69Oihqqoqeb3eJstdLpcaGhpkjAksi4yMVHV1tY4fP6433nhDv//97xUREaHv\nfve7GjFihGJjYztqjAAA4AxBPwLweDzyer2Bx42//BvXVVdXB9Z5vV717Nmz2TYulyvQrnHb6Oho\n9erVS8OGDVOfPn3Uo0cPJScn65133umQwQEAgOYFfQcgMTFRW7duVVpamsrKypSQkBBYFx8fr4MH\nD+rEiROKiIjQ7t27NWvWLElqts2QIUO0a9cujRw5Utu2bdPo0aM1dOhQvffee/r000/l8Xi0Z88e\n3XbbbSEa7r85nQ7FxETJ7Q76FDQrJiYq+EYh1tV9sL3+hdIHAGiLoL/9UlNTVVJSoszMTEmnTuTb\nvHmzampqlJGRoZycHM2cOVPGGKWnp6tv377NtpGk7OxsLV26VD6fT/Hx8UpLS5PD4dDChQs1c+ZM\nORwO3XjjjfrKV74SwiGf4vcbVVRUtSkAxMREqaKiKgS9unj6YHv9C6EPhA8A7RH0t5/D4dCKFSua\nLBs4cGDg/ykpKUpJSQnaRpLi4uJUUFBw1vIbb7xRN954Y2v7DAAA2okLAQEAYCECAAAAFiIAAABg\nIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCEC\nAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgBg\nIWOMcnNzlZmZqRkzZujw4cNN1m/ZskXp6enKzMzUM888c842hw4d0tSpUzVt2jStWLGiyX6OHTum\nG264QXV1dZKk2tpa/eAHP9B3v/tdzZ07V8ePH++E0QJoDgEAsFBRUZHq6uq0ceNGLVq0SHl5eYF1\n9fX1ys/P1/r161VQUKDCwkIdO3asxTZ5eXlauHChNmzYIL/fr6KiIknS9u3bNWvWLFVWVgb2/fTT\nTyshIUFPPfWUvvOd72jdunWdO3AAAQQAwEKlpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8ejsLAw\nJScna+fOnWe1KS8vlySVl5crOTlZkjR+/Hjt2LFDkuRyubR+/Xr17NmzSd3x48eftS2Azufu6g4A\n6HzV1dWKiooKPHa73fL7/XI6nWet69Gjh6qqquT1epssd7lcamhokDEmsCwyMlJVVVWSpGuvvVaS\nmqyvrq6Wx+MJbFtdXR2aAQIIigAAWMjj8cjr9QYeN/7yb1x3+i9mr9ernj17NtvG5XIF2jVuGx0d\n3aSWw+Fotu6ZgeJcYmJat11bde8eJn3WtraRkd3a3b9Qj68r632Rx9YV9ToSAQCwUGJiorZu3aq0\ntDSVlZUpISEhsC4+Pl4HDx7UiRMnFBERod27d2vWrFmS1GybIUOGaNeuXRo5cqS2bdum0aNHN6l1\n+jsAiYmJKi4u1rBhw1RcXBz46CCYioqq9g75nGpqfG1u6/XWtqt/MTFRIR9fV9X7Io+ts+uFImgQ\nAAALpaamqqSkRJmZmZJOnci3efNm1dTUKCMjQzk5OZo5c6aMMUpPT1ffvn2bbSNJ2dnZWrp0qXw+\nn+Lj45WWltak1unvAGRlZSk7O1tTp05VeHi41qxZ00kjBnAmAgBgIYfDcdZX9gYOHBj4f0pKilJS\nUoK2kaS4uDgVFBS0WOu1114L/D8iIkIPP/xwG3sNoCPxLQAAACxEAAAAwEIEAAAALEQAAADAQgQA\nAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAALEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAA\nLEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAALEQAAADAQgQAAAAsFDQAGGOUm5urzMxM\nzZgxQ4cPH26yfsuWLUpPT1dmZqaeeeaZc7Y5dOiQpk6dqmnTpmnFihVn1Zk9e7YKCws7amwAAKAF\nQQNAUVGR6urqtHHjRi1atEh5eXmBdfX19crPz9f69etVUFCgwsJCHTt2rMU2eXl5WrhwoTZs2CC/\n36+ioqLAvn7+85+rqqoqBEMEAABnChoASktLNW7cOEnS8OHDtXfv3sC6AwcOKDY2Vh6PR2FhYUpO\nTtbOnTvPalNeXi5JKi8vV3JysiRp/Pjx2rFjhyTp5ZdfltPp1NixYzt2dAAAoFlBA0B1dbWioqIC\nj91ut/x+f7PrevTooaqqKnm93ibLXS6XGhoaZIwJLIuMjFRVVZXee+89bd68WT/4wQ86ZEAAACA4\nd7ANPB6PvF5v4LHf75fT6Qysq66uDqzzer3q2bNns21cLlegXeO20dHRevHFF/Xxxx9rxowZOnLk\niMLDw9W/f/+QvxvgdDoUExMltzvoU9CsmJio4BuFWFf3wfb6F0ofAKAtgv72S0xM1NatW5WWlqay\nsjIlJCQE1sXHx+vgwYM6ceKEIiIitHv3bs2aNUuSmm0zZMgQ7dq1SyNHjtS2bds0evRoTZo0KbC/\ntWvXKiYmplM+CvD7jSoqqtoUAGJiolRR0bXnK3R1H2yvfyH0gfABoD2C/vZLTU1VSUmJMjMzJZ06\nkW/z5s2qqalRRkaGcnJyNHPmTBljlJ6err59+zbbRpKys7O1dOlS+Xw+xcfHKy0tLYRDAwAALQka\nABwOx1lf2Rs4cGDg/ykpKUpJSQnaRpLi4uJUUFDQYq277747WHcAAEAH4EJAAABYiAAAAICFCAAA\nAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABY\niAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgA\nAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAA\ngIUIAADpki9qAAARWUlEQVQAWIgAAACAhQgAAABYiAAAAICF3F3dAQCdzxij5cuXa//+/QoPD9eq\nVas0YMCAwPotW7Zo3bp1crvdmjJlijIyMlpsc+jQIS1ZskROp1ODBg1Sbm6uJGnTpk0qLCxUWFiY\n5s2bp5SUFEnS+PHjFRcXJ0kaMWKEFixY0NnDByACAGCloqIi1dXVaePGjdqzZ4/y8vK0bt06SVJ9\nfb3y8/P1/PPPq1u3bsrKytKECRNUWlrabJu8vDwtXLhQycnJys3NVVFRka655hoVFBTohRde0Oef\nf66srCyNGTNGH330kYYOHarHHnusi58BAAQAwEKlpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8cj\nSUpOTtbOnTtVVlbWpE15ebkkqby8XMnJyZJO/XVfUlIip9OppKQkud1ueTwexcXFaf/+/Tp06JCO\nHj2qGTNmqHv37lqyZIkGDhzYmUMH8H84BwCwUHV1taKiogKP3W63/H5/s+t69Oihqqoqeb3eJstd\nLpcaGhpkjAksi4yMVHV19VnbNu6jb9++mjt3rv73f/9Xc+bM0eLFi0M5TADnwDsAgIU8Ho+8Xm/g\nsd/vl9PpDKyrrq4OrPN6verZs2ezbVwuV6Bd47bR0dHN7iM6Olrx8fFyuVySpKSkJFVUVLSqvzEx\nUcE3aofu3cOkz9rWNjKyW7v7F+rxdWW9L/LYuqJeRyIAABZKTEzU1q1blZaWprKyMiUkJATWxcfH\n6+DBgzpx4oQiIiK0e/duzZo1S5KabTNkyBDt2rVLI0eO1LZt2zR69GgNGzZMDz30kOrq6lRbW6v3\n339fgwYN0i9+8Qv16tVLd955p/bt26fLL7+8Vf2tqKjq+CfhNDU1vja39Xpr29W/mJiokI+vq+p9\nkcfW2fVCETQIAICFUlNTVVJSoszMTElSXl6eNm/erJqaGmVkZCgnJ0czZ86UMUbp6enq27dvs20k\nKTs7W0uXLpXP51N8fLzS0tLkcDg0ffp0TZ06VcYYLVy4UOHh4YG3/YuLi+V2uwP7AND5CACAhRwO\nh1asWNFk2ekn46WkpAS+tneuNpIUFxengoKCs5ZnZGQoIyOjybLo6Gg9/vjj7eg5gI7CSYAAAFiI\nAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFgo6HUAOuO2oevXr9ef/vQnORwOjR8/Xnfd\ndVfoRgwAAIK/A3D6bUMXLVrU5MpdjbcNXb9+vQoKClRYWKhjx4612KbxtqEbNmyQ3+9XUVGRDh8+\nrM2bNwfuHb59+3a9++67oRsxAAAIHgBae9vQsLCwwG1Dz2zT0m1Dd+zYoX79+umJJ54I7LO+vl7d\nunXruBECAICzBA0AobxtaFVVlVwul3r16iVJWr16tYYMGaLY2Nj2jwwAALQo6DkAob5tqCTV1dUp\nJydHUVFRWr58ebsH1RpOp0MxMVFyu9t2O4QL4RaQXd0H2+tfKH0AgLYI+tsv1LcNlaT58+fr2muv\n1Z133hmKMTbL7zeqqKhqUwDo7FtOXoh9sL3+hdAHwgeA9gj62y/Utw0tKirS7t275fP5VFxcLIfD\noUWLFmn48OEhHDYAAHYLGgBCfdvQiRMnas+ePefTZwAA0E5cCAgAAAsRAAAAsBABAAAACxEAAACw\nEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBAB\nAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAA\nAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAAL\nEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEA\nAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALCQO9gGxhgtX75c\n+/fvV3h4uFatWqUBAwYE1m/ZskXr1q2T2+3WlClTlJGR0WKbQ4cOacmSJXI6nRo0aJByc3MlSZs2\nbVJhYaHCwsI0b948paSkhGzAALpuXtfW1mrx4sWqrKyUx+NRfn6+evfu3VVPA2C1oO8AFBUVqa6u\nThs3btSiRYuUl5cXWFdfX6/8/HytX79eBQUFKiws1LFjx1psk5eXp4ULF2rDhg3y+/0qKirSJ598\nEmj7xBNPaM2aNfL5fKEbMYAum9dPP/20EhIS9NRTT+k73/mO1q1b11VPAWC9oO8AlJaWaty4cZKk\n4cOHa+/evYF1Bw4cUGxsrDwejyQpOTlZO3fuVFlZWZM25eXlkqTy8nIlJydLksaPH6+SkhI5nU4l\nJSXJ7XbL4/EoLi5O+/fv11e/+tWOHekZjN+vAwf+n9xu13m3PX7co2PHqgOP4+KukMt1/vsBukpX\nzOt9+/aptLRUs2fPDmxLAAC6TtAAUF1draioqH83cLvl9/vldDrPWtejRw9VVVXJ6/U2We5yudTQ\n0CBjTGBZZGSkqqurz9q2cR/nYqoPyq/PWzfCFlR9tFffX/EvRXj6tGs/n1cf032zU/XlL8e2az/n\n68wQ0tlsr98RfYiPH9SBvTk/XTGvG5c3BovGbS8IDbXyV74lSXK5nWqo97e66fEIpw4ceK/NpTv7\ntdyZ9b7IY2upXlfO6/MVNAB4PB55vd7A48aDROO60yew1+tVz549m23jcrkC7Rq3jY6ObnYf0dHR\n5+xT0bOPtGJoAFrSVfP69H2cGRLOJSamddu11eoVPwrp/oELUdBzABITE1VcXCxJKisrU0JCQmBd\nfHy8Dh48qBMnTqiurk67d+/WNddcoxEjRjTbZsiQIdq1a5ckadu2bUpKStKwYcNUWlqquro6VVVV\n6f3339egQRdPggIuRl01r0/fR3FxceCjAwCdz2FOf/+uGaef+SudOuGnvLxcNTU1ysjI0Ouvv661\na9fKGKP09HRlZWU122bgwIH65z//qaVLl8rn8yk+Pl4rV66Uw+HQM888o8LCQhljNH/+fE2cODH0\nIwcs1lXz+vPPP1d2drYqKioUHh6uNWvW6JJLLunKpwKwVtAAAAAAvni4EBAAABYiAAAAYCECAAAA\nFgr6NcALSbDLl7ZHfX297r33Xh05ckQ+n0/z5s3TV77ylS65xGllZaWmTJmiJ598Ui6Xq1P78Ktf\n/UpbtmyRz+fT1KlTNXLkyE6tX19fr+zsbB05ckRut1v3339/pz0He/bs0c9+9jMVFBR0yOVty8rK\n9MADD8jtduu6667T3Xff3er677zzjlauXCmXy6Xw8HA9+OCD6tOnT0jrd4VXX31Vf/7zn7VmzRpJ\np56DVatWndXntWvXqri4WG63Wzk5Obr66qt1/Phx/fjHP1Ztba369u2rvLw8devWrdnLGLdGRx1f\nOut1FKpjVkv1/H6/7rvvPv3jH/+Q0+nUihUrFB4eHtJ50tHHwnPVuuWWWwLXqPjSl76kefPmhbRe\nKI615z3nzUXklVdeMUuWLDHGGFNWVmbmz5/fYft+7rnnzAMPPGCMMeazzz4zKSkpZt68eWbXrl3G\nGGOWLVtmXn31VVNRUWEmT55sfD6fqaqqMpMnTzZ1dXXmySefNI888ogxxpg//vGPZuXKlW3qh8/n\nM3fddZe54YYbzPvvv9+pfXjjjTfMvHnzjDHGeL1e88gjj3T6c1BUVGR+9KMfGWOMKSkpMffcc0+n\n9OG///u/zeTJk81tt91mjDEdUvM73/mOOXz4sDHGmNmzZ5t33nmn1fWnTZtm9u3bZ4wxZuPGjSY/\nPz+k9bvCypUrzaRJk8zChQsDy5rrc3l5ubn99tuNMcZ8+OGHZsqUKcYYY+6//37zwgsvGGOMefzx\nx8369euNz+czqamppqqqytTV1ZkpU6aYysrKVvWnI44vnfk6CtUxq6V6r776qrn33nuNMaeOFfPn\nzw9pvVAcC1uqVVtba26++eYmP8tQ1gvVsfZ85/xF9RHAuS5f2l6TJk3SD3/4Q0lSQ0ODXC6X3n77\n7SaXOP3rX/+qv//97y1e4nT8+PGBbXfs2NGmfqxevVpZWVnq27evjDGd2oft27crISFB3//+9zV/\n/nylpKR0+nMQFxcXuLpcVVWV3G53p/QhNjZWjz76aODxmZe3PZ+af/vb31RdXS2fz6cvfelLkqSx\nY8fqr3/9a6vrP/TQQxo8eLCkU3/phYeHh7R+V0hMTNTy5csDj5vrc0lJiUpLSzVmzBhJ0uWXXy6/\n369jx47pzTffDBwPGn/Wp1/GOCwsTElJSYFrFATTEceXznwddfQxK1i9iRMn6v7775ckffjhh+rZ\ns2dI63XksTBYrX379unkyZOaNWuW7rjjDu3Zsyek9Tr6WNvWOX9RBYCWLl/aEbp37x64XOkPf/hD\nLViwoNMvcfr888/rkksu0ZgxYwK1Tx9fqPtw/Phx7d27V7/4xS+0fPly/fjHP+7U+o3tPvjgA6Wl\npWnZsmWaPn16p/wcUlNTm9zPoT01Gy+b27js9OWtrX/ppZdKkt5880399re/1R133NHsJXo7qn4o\nPfvss/r2t7/d5N/evXs1adKkJtu11Oczn/fmfh7n2ra14+6I40tnvo46+pjVmteN0+nUkiVLtHLl\nSk2ePDlk9Tr6WBhsbBEREZo1a5Z+/etfB459oXwuO/pY29Y5f1GdA3Cuy5d2hI8++kh33323pk2b\npm9961v66U9/GlgXqkucnu7555+Xw+FQSUmJ9u/fr+zsbB0/frzT+tCrVy/Fx8fL7XZr4MCB6tat\nm44ePdqpz8H69es1btw4LViwQEePHtX06dOb3B2yM/ogqd2Xtz0zfLTmEtdn+tOf/qTHH39cv/rV\nr9S7d+9Or99R0tPTlZ6eHnS75vrcs2dPhYWFNZn31dXVio6ODmzfp0+fwLjbcmnxRqE4voT6ddTR\nx6zWvG7y8/NVWVmp9PR01dbWhqReKI6F5xpbXFycYmNjA//v1auX3n777ZDVC8Wxti1z/qJ6B+Bc\nly9tr08++USzZs3S4sWLdfPNN0uSrrrqqk69xOmGDRtUUFCggoICXXnllXrwwQc1bty4TutDUlKS\n/vKXv0iSjh49qpqaGo0ePVo7d+7stOeg8ZrzkhQVFaX6+noNGTKkU/sgtf/yth6PR+Hh4Tp8+LCM\nMdq+fbuSkpJaXf/FF1/UU089pYKCAvXv31+SdPXVV3da/a7QUp9HjBih7du3yxijDz/8UMYY9erV\nS4mJidq2bZukUz+j5ORkXXHFFU0uY7xr1y5dc801raofiuNLKF9HoThmnaveiy++qF/96leSpG7d\nusnpdOqrX/1qu+ZmS/VCcSw819iee+455efnSzp17KuurtaYMWNCMjYpNMfatsz5i+pKgKaFS5F2\nhFWrVumll17SFVdcIWOMHA6HfvKTn2jlypVdconTGTNmaMWKFXI4HJ16mdWf/exn+tvf/iZjjBYt\nWqT+/fvrvvvu67T6J0+e1L333quKigrV19fr9ttv19ChQzulD0eOHNGiRYu0cePGDrm87d///net\nWrVKfr9fY8aM0Y9+dO4bzjTW/+1vf6trr71W/fr1k8fjkcPh0KhRo3T33XeHtH5X2LlzpwoLCwPf\nAmipz2vXrtW2bdtkjFFOTo4SExNVWVmp7OxsnTx5Ur1799aaNWsUERHR7GWMW6Ojji+d9ToK1TGr\npXo1NTXKycnRJ598ovr6es2dO1dXXHFFu+dmsNdpRx4LW6rl8/mUk5OjDz/8UE6nU4sXL1avXr1C\nOrZQHGvPd85fVAEAAAB0jIvqIwAAANAxCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICF\nCAAAAFjo/wOY67O5O3hY0wAAAABJRU5ErkJggg==\n", + "text/plain": [ + "<matplotlib.figure.Figure at 0x43a236a0>" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import seaborn as sns\n", + "df_cln2.hist(normed=True)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Single pipeline" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "all_pipeline = Pipeline([\n", + " ('transform',mimic_transform),\n", + " ('format',standard_pipeline),\n", + " ('clean',cleaning_pipeline)\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>382993.000000</td>\n", + " <td>393608</td>\n", + " <td>393608</td>\n", + " <td>393608</td>\n", + " <td>393608.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>NaN</td>\n", + " <td>187323</td>\n", + " <td>616</td>\n", + " <td>2</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>NaN</td>\n", + " <td>2140-07-14 03:59:00</td>\n", + " <td>1.2</td>\n", + " <td>mmol/L</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>NaN</td>\n", + " <td>8</td>\n", + " <td>20704</td>\n", + " <td>393592</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>first</th>\n", + " <td>NaN</td>\n", + " <td>2096-08-25 16:32:00</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>last</th>\n", + " <td>NaN</td>\n", + " <td>2210-08-19 04:56:00</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>150112.612539</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>64364.242439</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>28874.716612</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>77900.842790</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>100001.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>818.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>125190.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1531.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>149789.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>50813.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>175567.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>50813.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>199999.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>225668.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "count 382993.000000 393608 393608 393608 393608.000000\n", + "unique NaN 187323 616 2 NaN\n", + "top NaN 2140-07-14 03:59:00 1.2 mmol/L NaN\n", + "freq NaN 8 20704 393592 NaN\n", + "first NaN 2096-08-25 16:32:00 NaN NaN NaN\n", + "last NaN 2210-08-19 04:56:00 NaN NaN NaN\n", + "mean 150112.612539 NaN NaN NaN 64364.242439\n", + "std 28874.716612 NaN NaN NaN 77900.842790\n", + "min 100001.000000 NaN NaN NaN 818.000000\n", + "25% 125190.000000 NaN NaN NaN 1531.000000\n", + "50% 149789.000000 NaN NaN NaN 50813.000000\n", + "75% 175567.000000 NaN NaN NaN 50813.000000\n", + "max 199999.000000 NaN NaN NaN 225668.000000" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "label = 'lactate'\n", + "df = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n", + "df.describe(include='all')" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th>mmol/L</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>100001</th>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100003</th>\n", + " <th>2150-04-17 19:12:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-08 10:58:00</th>\n", + " <td>4.5</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-03-31 00:44:00</th>\n", + " <td>3.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-02 14:10:00</th>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100009</th>\n", + " <th>2162-05-17 13:19:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2162-05-17 17:14:00</th>\n", + " <td>1.5</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">100010</th>\n", + " <th>2109-12-10 10:25:00</th>\n", + " <td>0.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 12:11:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:05:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:58:00</th>\n", + " <td>0.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100011</th>\n", + " <th>2177-08-29 04:44:00</th>\n", + " <td>3.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-08-29 06:55:00</th>\n", + " <td>2.3</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100012</th>\n", + " <th>2177-03-14 07:38:00</th>\n", + " <td>2.3</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-14 11:42:00</th>\n", + " <td>2.5</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 08:05:00</th>\n", + " <td>2.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 14:01:00</th>\n", + " <td>2.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 21:42:00</th>\n", + " <td>1.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100016</th>\n", + " <th>2188-05-24 12:00:00</th>\n", + " <td>2.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100017</th>\n", + " <th>2103-03-11 05:10:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100018</th>\n", + " <th>2176-08-29 15:29:00</th>\n", + " <td>1.3</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 09:23:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 10:19:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 11:29:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 12:40:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100020</th>\n", + " <th>2142-11-30 21:54:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2142-12-03 00:17:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100024</th>\n", + " <th>2170-09-19 10:25:00</th>\n", + " <td>1.4</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-19 16:33:00</th>\n", + " <td>2.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-20 02:04:00</th>\n", + " <td>3.2</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199976</th>\n", + " <th>2182-02-14 11:15:00</th>\n", + " <td>0.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-16 03:57:00</th>\n", + " <td>0.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-19 03:59:00</th>\n", + " <td>0.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-20 03:31:00</th>\n", + " <td>0.7</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-21 04:55:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199979</th>\n", + " <th>2182-02-06 09:17:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-06 14:16:00</th>\n", + " <td>3.8</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">199981</th>\n", + " <th>2110-09-24 16:34:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-24 20:09:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-25 06:10:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>199987</th>\n", + " <th>2175-05-19 16:30:00</th>\n", + " <td>2.3</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">199988</th>\n", + " <th>2169-01-24 12:48:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 01:35:00</th>\n", + " <td>1.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 11:18:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 16:43:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 22:35:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-10 05:33:00</th>\n", + " <td>1.4</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199993</th>\n", + " <th>2161-11-12 23:14:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-11-13 03:46:00</th>\n", + " <td>0.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">199994</th>\n", + " <th>2188-07-07 21:23:00</th>\n", + " <td>1.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 03:09:00</th>\n", + " <td>0.7</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 04:13:00</th>\n", + " <td>0.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 06:20:00</th>\n", + " <td>0.7</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199998</th>\n", + " <th>2119-02-20 10:52:00</th>\n", + " <td>1.1</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 12:36:00</th>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:33:00</th>\n", + " <td>2.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:59:00</th>\n", + " <td>2.6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 20:43:00</th>\n", + " <td>1.3</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199999</th>\n", + " <th>2136-04-04 20:55:00</th>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 15:29:00</th>\n", + " <td>1.8</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>177439 rows × 1 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label lactate\n", + "status known\n", + "variable_type qn\n", + "units mmol/L\n", + "id datetime \n", + "100001 2117-09-11 09:32:00 1.9\n", + "100003 2150-04-17 19:12:00 1.1\n", + "100006 2108-04-08 10:58:00 4.5\n", + "100007 2145-03-31 00:44:00 3.1\n", + " 2145-04-02 14:10:00 1.9\n", + "100009 2162-05-17 13:19:00 1.1\n", + " 2162-05-17 17:14:00 1.5\n", + "100010 2109-12-10 10:25:00 0.6\n", + " 2109-12-10 12:11:00 0.9\n", + " 2109-12-10 13:05:00 1.0\n", + " 2109-12-10 13:58:00 0.8\n", + "100011 2177-08-29 04:44:00 3.8\n", + " 2177-08-29 06:55:00 2.3\n", + "100012 2177-03-14 07:38:00 2.3\n", + " 2177-03-14 11:42:00 2.5\n", + " 2177-03-15 08:05:00 2.1\n", + " 2177-03-15 14:01:00 2.6\n", + " 2177-03-15 21:42:00 1.8\n", + "100016 2188-05-24 12:00:00 2.0\n", + "100017 2103-03-11 05:10:00 1.1\n", + "100018 2176-08-29 15:29:00 1.3\n", + " 2176-08-30 09:23:00 0.9\n", + " 2176-08-30 10:19:00 1.0\n", + " 2176-08-30 11:29:00 0.9\n", + " 2176-08-30 12:40:00 1.1\n", + "100020 2142-11-30 21:54:00 1.1\n", + " 2142-12-03 00:17:00 1.0\n", + "100024 2170-09-19 10:25:00 1.4\n", + " 2170-09-19 16:33:00 2.6\n", + " 2170-09-20 02:04:00 3.2\n", + "... ...\n", + "199976 2182-02-14 11:15:00 0.8\n", + " 2182-02-16 03:57:00 0.8\n", + " 2182-02-19 03:59:00 0.8\n", + " 2182-02-20 03:31:00 0.7\n", + " 2182-02-21 04:55:00 0.9\n", + "199979 2182-02-06 09:17:00 1.0\n", + " 2182-02-06 14:16:00 3.8\n", + "199981 2110-09-24 16:34:00 1.1\n", + " 2110-09-24 20:09:00 1.0\n", + " 2110-09-25 06:10:00 1.0\n", + "199987 2175-05-19 16:30:00 2.3\n", + "199988 2169-01-24 12:48:00 1.0\n", + " 2169-02-07 01:35:00 1.6\n", + " 2169-02-07 11:18:00 1.0\n", + " 2169-02-07 16:43:00 1.0\n", + " 2169-02-07 22:35:00 1.1\n", + " 2169-02-10 05:33:00 1.4\n", + "199993 2161-11-12 23:14:00 0.9\n", + " 2161-11-13 03:46:00 0.9\n", + "199994 2188-07-07 21:23:00 1.0\n", + " 2188-07-08 03:09:00 0.7\n", + " 2188-07-08 04:13:00 0.6\n", + " 2188-07-08 06:20:00 0.7\n", + "199998 2119-02-20 10:52:00 1.1\n", + " 2119-02-20 12:36:00 1.9\n", + " 2119-02-20 13:33:00 2.0\n", + " 2119-02-20 13:59:00 2.6\n", + " 2119-02-20 20:43:00 1.3\n", + "199999 2136-04-04 20:55:00 1.9\n", + " 2136-04-06 15:29:00 1.8\n", + "\n", + "[177439 rows x 1 columns]" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "all_pipeline.set_params(transform__add_level__level_val=label)\n", + "all_pipeline.transform(df)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Loop over everything" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import logger" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:18:23) heart rate\n", + "(2017-06-03 07:18:23)>> Open Extract\n", + "(2017-06-03 07:18:26)<< DONE (3.0s)\n", + "(2017-06-03 07:18:26)>> Run Pipeline\n", + "(2017-06-03 07:21:19)<< DONE (173.0s)\n", + "(2017-06-03 07:21:19)>> Analyze...\n", + "((7952939, 1), (7922961, 1), 29978L, 171, '0.3015% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>heart rate</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>beats/min</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>7.922961e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>1.026618e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>3.552932e+03</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-8.800000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>7.700000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>9.200000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>1.190000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>9.999999e+06</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label heart rate\n", + "status known\n", + "variable_type qn\n", + "units beats/min\n", + "count 7.922961e+06\n", + "mean 1.026618e+02\n", + "std 3.552932e+03\n", + "min -8.800000e+01\n", + "25% 7.700000e+01\n", + "50% 9.200000e+01\n", + "75% 1.190000e+02\n", + "max 9.999999e+06" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:21:20)<< DONE (1.0s)\n", + "(2017-06-03 07:21:20)>> Joining!\n", + "(2017-06-03 07:21:20)<< DONE (0.0s)\n", + "(2017-06-03 07:21:20) DONE (177.0s)\n", + "(2017-06-03 07:21:20) blood pressure systolic\n", + "(2017-06-03 07:21:20)>> Open Extract\n", + "(2017-06-03 07:21:23)<< DONE (3.0s)\n", + "(2017-06-03 07:21:23)>> Run Pipeline\n", + "(2017-06-03 07:25:39)<< DONE (256.0s)\n", + "(2017-06-03 07:25:39)>> Analyze...\n", + "((6374824, 1), (5974186, 1), 548979L, 174, '0.307% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>blood pressure systolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mmHg</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>5.825845e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>1.214682e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>1.311542e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-6.900000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>1.040000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>1.190000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>1.370000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>1.411460e+05</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label blood pressure systolic\n", + "status known\n", + "variable_type qn\n", + "units mmHg\n", + "count 5.825845e+06\n", + "mean 1.214682e+02\n", + "std 1.311542e+02\n", + "min -6.900000e+01\n", + "25% 1.040000e+02\n", + "50% 1.190000e+02\n", + "75% 1.370000e+02\n", + "max 1.411460e+05" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:25:40)<< DONE (1.0s)\n", + "(2017-06-03 07:25:40)>> Joining!\n", + "(2017-06-03 07:26:28)<< DONE (48.0s)\n", + "(2017-06-03 07:26:28) DONE (308.0s)\n", + "(2017-06-03 07:26:28) blood pressure diastolic\n", + "(2017-06-03 07:26:28)>> Open Extract\n", + "(2017-06-03 07:26:31)<< DONE (3.0s)\n", + "(2017-06-03 07:26:31)>> Run Pipeline\n", + "(2017-06-03 07:30:32)<< DONE (241.0s)\n", + "(2017-06-03 07:30:32)>> Analyze...\n", + "((6371249, 1), (5976313, 1), 543269L, 170, '0.2999% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>blood pressure diastolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mmHg</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>5.827980e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>6.115824e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2.350768e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-1.600000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>5.000000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>5.900000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>6.900000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>1.141090e+05</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label blood pressure diastolic\n", + "status known\n", + "variable_type qn\n", + "units mmHg\n", + "count 5.827980e+06\n", + "mean 6.115824e+01\n", + "std 2.350768e+02\n", + "min -1.600000e+01\n", + "25% 5.000000e+01\n", + "50% 5.900000e+01\n", + "75% 6.900000e+01\n", + "max 1.141090e+05" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:30:34)<< DONE (2.0s)\n", + "(2017-06-03 07:30:34)>> Joining!\n", + "(2017-06-03 07:31:25)<< DONE (51.0s)\n", + "(2017-06-03 07:31:25) DONE (297.0s)\n", + "(2017-06-03 07:31:25) blood pressure mean\n", + "(2017-06-03 07:31:25)>> Open Extract\n", + "(2017-06-03 07:31:26)<< DONE (1.0s)\n", + "(2017-06-03 07:31:26)>> Run Pipeline\n", + "(2017-06-03 07:32:39)<< DONE (73.0s)\n", + "(2017-06-03 07:32:39)>> Analyze...\n", + "((2536271, 1), (2415995, 1), 120276L, 0, '0.0% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>blood pressure mean</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mmHg</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>2.415995e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>7.879668e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>1.413279e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-1.350000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>6.700000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>7.700000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>8.800000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>1.201300e+05</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label blood pressure mean\n", + "status known\n", + "variable_type qn\n", + "units mmHg\n", + "count 2.415995e+06\n", + "mean 7.879668e+01\n", + "std 1.413279e+02\n", + "min -1.350000e+02\n", + "25% 6.700000e+01\n", + "50% 7.700000e+01\n", + "75% 8.800000e+01\n", + "max 1.201300e+05" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:32:40)<< DONE (1.0s)\n", + "(2017-06-03 07:32:40)>> Joining!\n", + "(2017-06-03 07:33:20)<< DONE (40.0s)\n", + "(2017-06-03 07:33:20) DONE (115.0s)\n", + "(2017-06-03 07:33:20) respiratory rate\n", + "(2017-06-03 07:33:20)>> Open Extract\n", + "(2017-06-03 07:33:24)<< DONE (4.0s)\n", + "(2017-06-03 07:33:24)>> Run Pipeline\n", + "(2017-06-03 07:37:33)<< DONE (249.0s)\n", + "(2017-06-03 07:37:33)>> Analyze...\n", + "((7810019, 1), (7780015, 1), 5072936L, 172, '0.3035% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>respiratory rate</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>insp/min</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>2.737083e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>2.092347e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>1.423811e+03</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000e+00</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>1.600000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>2.000000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>2.400000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>2.355555e+06</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label respiratory rate\n", + "status known\n", + "variable_type qn\n", + "units insp/min\n", + "count 2.737083e+06\n", + "mean 2.092347e+01\n", + "std 1.423811e+03\n", + "min 0.000000e+00\n", + "25% 1.600000e+01\n", + "50% 2.000000e+01\n", + "75% 2.400000e+01\n", + "max 2.355555e+06" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:37:35)<< DONE (2.0s)\n", + "(2017-06-03 07:37:35)>> Joining!\n", + "(2017-06-03 07:38:29)<< DONE (54.0s)\n", + "(2017-06-03 07:38:29) DONE (309.0s)\n", + "(2017-06-03 07:38:29) temperature body\n", + "(2017-06-03 07:38:29)>> Open Extract\n", + "(2017-06-03 07:38:31)<< DONE (2.0s)\n", + "(2017-06-03 07:38:31)>> Run Pipeline\n", + "(2017-06-03 07:39:35)<< DONE (64.0s)\n", + "(2017-06-03 07:39:35)>> Analyze...\n", + "((1751447, 1), (1731794, 1), 461152L, 156, '0.3189% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>degF</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>1.290295e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>9.850479e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>9.563484e+00</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-9.990000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>9.760000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>9.850000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>9.950000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>9.637000e+03</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body\n", + "status known\n", + "variable_type qn\n", + "units degF\n", + "count 1.290295e+06\n", + "mean 9.850479e+01\n", + "std 9.563484e+00\n", + "min -9.990000e+01\n", + "25% 9.760000e+01\n", + "50% 9.850000e+01\n", + "75% 9.950000e+01\n", + "max 9.637000e+03" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:39:36)<< DONE (1.0s)\n", + "(2017-06-03 07:39:36)>> Joining!\n", + "(2017-06-03 07:40:14)<< DONE (38.0s)\n", + "(2017-06-03 07:40:14) DONE (105.0s)\n", + "(2017-06-03 07:40:14) oxygen saturation pulse oximetry\n", + "(2017-06-03 07:40:14)>> Open Extract\n", + "(2017-06-03 07:40:17)<< DONE (3.0s)\n", + "(2017-06-03 07:40:17)>> Run Pipeline\n", + "(2017-06-03 07:42:42)<< DONE (145.0s)\n", + "(2017-06-03 07:42:42)>> Analyze...\n", + "((6099827, 1), (6073019, 1), 26808L, 163, '0.3326% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>oxygen saturation pulse oximetry</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>percent</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>6.073019e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>9.885942e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2.942035e+03</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000e+00</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>9.600000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>9.800000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>9.900000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>6.363333e+06</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label oxygen saturation pulse oximetry\n", + "status known\n", + "variable_type qn\n", + "units percent\n", + "count 6.073019e+06\n", + "mean 9.885942e+01\n", + "std 2.942035e+03\n", + "min 0.000000e+00\n", + "25% 9.600000e+01\n", + "50% 9.800000e+01\n", + "75% 9.900000e+01\n", + "max 6.363333e+06" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:42:43)<< DONE (1.0s)\n", + "(2017-06-03 07:42:43)>> Joining!\n", + "(2017-06-03 07:43:35)<< DONE (52.0s)\n", + "(2017-06-03 07:43:35) DONE (201.0s)\n", + "(2017-06-03 07:43:35) weight body\n", + "(2017-06-03 07:43:35)>> Open Extract\n", + "(2017-06-03 07:43:36)<< DONE (1.0s)\n", + "(2017-06-03 07:43:36)>> Run Pipeline\n", + "(2017-06-03 07:43:40)<< DONE (4.0s)\n", + "(2017-06-03 07:43:40)>> Analyze...\n", + "((95425, 1), (94457, 1), 1956L, 158, '0.4958% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>weight body</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>kg</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>9.346900e+04</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>2.676828e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>3.908673e+04</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000e+00</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>6.980000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>8.340000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>9.890000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>8.654765e+06</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label weight body\n", + "status known\n", + "variable_type qn\n", + "units kg\n", + "count 9.346900e+04\n", + "mean 2.676828e+02\n", + "std 3.908673e+04\n", + "min 0.000000e+00\n", + "25% 6.980000e+01\n", + "50% 8.340000e+01\n", + "75% 9.890000e+01\n", + "max 8.654765e+06" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:43:40)<< DONE (0.0s)\n", + "(2017-06-03 07:43:40)>> Joining!\n", + "(2017-06-03 07:44:15)<< DONE (35.0s)\n", + "(2017-06-03 07:44:15) DONE (40.0s)\n", + "(2017-06-03 07:44:15) output urine\n", + "(2017-06-03 07:44:15)>> Open Extract\n", + "(2017-06-03 07:44:16)<< DONE (1.0s)\n", + "(2017-06-03 07:44:16)>> Run Pipeline\n", + "(2017-06-03 07:47:57)<< DONE (221.0s)\n", + "(2017-06-03 07:47:57)>> Analyze...\n", + "((3644639, 1), (3624029, 1), 417242L, 92, '0.1758% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>output urine</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>3.216363e+06</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>1.265574e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2.577291e+03</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-1.500000e+03</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>4.200000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>8.000000e+01</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>1.600000e+02</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>4.555555e+06</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label output urine\n", + "status known\n", + "variable_type qn\n", + "units mL\n", + "count 3.216363e+06\n", + "mean 1.265574e+02\n", + "std 2.577291e+03\n", + "min -1.500000e+03\n", + "25% 4.200000e+01\n", + "50% 8.000000e+01\n", + "75% 1.600000e+02\n", + "max 4.555555e+06" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:47:58)<< DONE (1.0s)\n", + "(2017-06-03 07:47:58)>> Joining!\n", + "(2017-06-03 07:48:43)<< DONE (45.0s)\n", + "(2017-06-03 07:48:43) DONE (268.0s)\n", + "(2017-06-03 07:48:43) glasgow coma scale motor\n", + "(2017-06-03 07:48:43)>> Open Extract\n", + "(2017-06-03 07:48:43)<< DONE (0.0s)\n", + "(2017-06-03 07:48:43)>> Run Pipeline\n", + "(2017-06-03 07:49:29)<< DONE (46.0s)\n", + "(2017-06-03 07:49:29)>> Analyze...\n", + "((952565, 1), (949198, 1), 3367L, 1, '0.0037% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>glasgow coma scale motor</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>949198</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>6</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>Obeys commands</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>642879</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale motor\n", + "status known\n", + "variable_type ord\n", + "units no_units\n", + "count 949198\n", + "unique 6\n", + "top Obeys commands\n", + "freq 642879" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:49:29)<< DONE (0.0s)\n", + "(2017-06-03 07:49:29)>> Joining!\n", + "(2017-06-03 07:50:06)<< DONE (37.0s)\n", + "(2017-06-03 07:50:06) DONE (83.0s)\n", + "(2017-06-03 07:50:06) glasgow coma scale eye opening\n", + "(2017-06-03 07:50:06)>> Open Extract\n", + "(2017-06-03 07:50:07)<< DONE (1.0s)\n", + "(2017-06-03 07:50:07)>> Run Pipeline\n", + "(2017-06-03 07:50:50)<< DONE (43.0s)\n", + "(2017-06-03 07:50:50)>> Analyze...\n", + "((956672, 1), (953595, 1), 3077L, 1, '0.0037% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>glasgow coma scale eye opening</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>953595</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>4</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>Eyes open spontaneously</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>588057</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale eye opening\n", + "status known\n", + "variable_type ord\n", + "units no_units\n", + "count 953595\n", + "unique 4\n", + "top Eyes open spontaneously\n", + "freq 588057" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:50:50)<< DONE (0.0s)\n", + "(2017-06-03 07:50:50)>> Joining!\n", + "(2017-06-03 07:51:28)<< DONE (38.0s)\n", + "(2017-06-03 07:51:28) DONE (82.0s)\n", + "(2017-06-03 07:51:28) glasgow coma scale verbal\n", + "(2017-06-03 07:51:28)>> Open Extract\n", + "(2017-06-03 07:51:29)<< DONE (1.0s)\n", + "(2017-06-03 07:51:29)>> Run Pipeline\n", + "(2017-06-03 07:52:14)<< DONE (45.0s)\n", + "(2017-06-03 07:52:14)>> Analyze...\n", + "((954700, 1), (950913, 1), 3787L, 2, '0.0074% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>glasgow coma scale verbal</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>ord</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>no_units</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>950913</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>5</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>No verbal response (>2 yrs); no vocal response...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>465193</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label glasgow coma scale verbal\n", + "status known\n", + "variable_type ord\n", + "units no_units\n", + "count 950913\n", + "unique 5\n", + "top No verbal response (>2 yrs); no vocal response...\n", + "freq 465193" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 07:52:14)<< DONE (0.0s)\n", + "(2017-06-03 07:52:14)>> Joining!\n", + "(2017-06-03 07:52:51)<< DONE (37.0s)\n", + "(2017-06-03 07:52:51) DONE (83.0s)\n", + "(2017-06-03 07:52:51) normal saline\n", + "(2017-06-03 07:52:51)>> Open Extract\n", + "(2017-06-03 07:52:51)<< DONE (0.0s)\n", + "(2017-06-03 07:52:51)>> Run Pipeline\n", + "(2017-06-03 08:01:38)<< DONE (527.0s)\n", + "(2017-06-03 08:01:38)>> Analyze...\n", + "((817373, 1), (504874, 2), 265615L, 8, '0.0405% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">normal saline</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>49173.000000</td>\n", + " <td>456484.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>389.563178</td>\n", + " <td>75.626948</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>380.287765</td>\n", + " <td>217.512467</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>-906.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>100.000000</td>\n", + " <td>6.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>250.000000</td>\n", + " <td>15.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>500.000000</td>\n", + " <td>62.204886</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>11000.000000</td>\n", + " <td>51947.999400</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label normal saline \n", + "status known \n", + "variable_type qn \n", + "units mL mL/hr\n", + "count 49173.000000 456484.000000\n", + "mean 389.563178 75.626948\n", + "std 380.287765 217.512467\n", + "min 0.000000 -906.000000\n", + "25% 100.000000 6.000000\n", + "50% 250.000000 15.000000\n", + "75% 500.000000 62.204886\n", + "max 11000.000000 51947.999400" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:01:38)<< DONE (0.0s)\n", + "(2017-06-03 08:01:38)>> Joining!\n", + "(2017-06-03 08:02:15)<< DONE (37.0s)\n", + "(2017-06-03 08:02:15) DONE (564.0s)\n", + "(2017-06-03 08:02:15) lactated ringers\n", + "(2017-06-03 08:02:15)>> Open Extract\n", + "(2017-06-03 08:02:15)<< DONE (0.0s)\n", + "(2017-06-03 08:02:15)>> Run Pipeline\n", + "(2017-06-03 08:02:57)<< DONE (42.0s)\n", + "(2017-06-03 08:02:57)>> Analyze...\n", + "((504306, 1), (254175, 2), 19193L, 18, '0.1085% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>248510.000000</td>\n", + " <td>2161.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>204.109607</td>\n", + " <td>289.877760</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>338.277593</td>\n", + " <td>418.153805</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>15.000000</td>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>100.000000</td>\n", + " <td>99.994818</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>200.000000</td>\n", + " <td>499.999980</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>60000.000000</td>\n", + " <td>3923.333176</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label lactated ringers \n", + "status known \n", + "variable_type qn \n", + "units mL mL/hr\n", + "count 248510.000000 2161.000000\n", + "mean 204.109607 289.877760\n", + "std 338.277593 418.153805\n", + "min 0.000000 0.000000\n", + "25% 15.000000 0.000000\n", + "50% 100.000000 99.994818\n", + "75% 200.000000 499.999980\n", + "max 60000.000000 3923.333176" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:02:57)<< DONE (0.0s)\n", + "(2017-06-03 08:02:57)>> Joining!\n", + "(2017-06-03 08:03:34)<< DONE (37.0s)\n", + "(2017-06-03 08:03:34) DONE (79.0s)\n", + "(2017-06-03 08:03:34) norepinephrine\n", + "(2017-06-03 08:03:34)>> Open Extract\n", + "(2017-06-03 08:03:34)<< DONE (0.0s)\n", + "(2017-06-03 08:03:34)>> Run Pipeline\n", + "(2017-06-03 08:05:19)<< DONE (105.0s)\n", + "(2017-06-03 08:05:19)>> Analyze...\n", + "((1136938, 1), (389986, 2), 331666L, 17, '0.231% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mcg/kg/min</th>\n", + " <th>mcg/min</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>286781.000000</td>\n", + " <td>14226.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>0.141207</td>\n", + " <td>9.687762</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>0.343212</td>\n", + " <td>14.889317</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>0.035000</td>\n", + " <td>2.666667</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>0.080000</td>\n", + " <td>6.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>0.180000</td>\n", + " <td>12.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>50.000000</td>\n", + " <td>250.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label norepinephrine \n", + "status known \n", + "variable_type qn \n", + "units mcg/kg/min mcg/min\n", + "count 286781.000000 14226.000000\n", + "mean 0.141207 9.687762\n", + "std 0.343212 14.889317\n", + "min 0.000000 0.000000\n", + "25% 0.035000 2.666667\n", + "50% 0.080000 6.000000\n", + "75% 0.180000 12.000000\n", + "max 50.000000 250.000000" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:05:20)<< DONE (1.0s)\n", + "(2017-06-03 08:05:20)>> Joining!\n", + "(2017-06-03 08:05:58)<< DONE (38.0s)\n", + "(2017-06-03 08:05:58) DONE (144.0s)\n", + "(2017-06-03 08:05:58) vasopressin\n", + "(2017-06-03 08:05:58)>> Open Extract\n", + "(2017-06-03 08:05:58)<< DONE (0.0s)\n", + "(2017-06-03 08:05:58)>> Run Pipeline\n", + "(2017-06-03 08:06:20)<< DONE (22.0s)\n", + "(2017-06-03 08:06:20)>> Analyze...\n", + "((339184, 1), (110333, 2), 16608L, 8, '0.3406% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"2\" halign=\"left\">vasopressin</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>units</th>\n", + " <th>units/min</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>57371.000000</td>\n", + " <td>98872.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>2.517366</td>\n", + " <td>0.992521</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>4.842854</td>\n", + " <td>1.291858</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>1.800000</td>\n", + " <td>0.040000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>2.400000</td>\n", + " <td>0.044000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>2.400000</td>\n", + " <td>2.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>722.400000</td>\n", + " <td>50.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label vasopressin \n", + "status known \n", + "variable_type qn \n", + "units units units/min\n", + "count 57371.000000 98872.000000\n", + "mean 2.517366 0.992521\n", + "std 4.842854 1.291858\n", + "min 0.000000 0.000000\n", + "25% 1.800000 0.040000\n", + "50% 2.400000 0.044000\n", + "75% 2.400000 2.400000\n", + "max 722.400000 50.000000" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:06:20)<< DONE (0.0s)\n", + "(2017-06-03 08:06:20)>> Joining!\n", + "(2017-06-03 08:06:56)<< DONE (36.0s)\n", + "(2017-06-03 08:06:56) DONE (58.0s)\n", + "(2017-06-03 08:06:56) hemoglobin\n", + "(2017-06-03 08:06:56)>> Open Extract\n", + "(2017-06-03 08:06:56)<< DONE (0.0s)\n", + "(2017-06-03 08:06:56)>> Run Pipeline\n", + "(2017-06-03 08:07:52)<< DONE (56.0s)\n", + "(2017-06-03 08:07:52)>> Analyze...\n", + "((1167921, 1), (671087, 1), 641393L, 7, '0.0123% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>hemoglobin</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>g/dL</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>526528.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>10.351784</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>1.980592</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>9.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>10.100000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>11.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>130.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label hemoglobin\n", + "status known\n", + "variable_type qn\n", + "units g/dL\n", + "count 526528.000000\n", + "mean 10.351784\n", + "std 1.980592\n", + "min 0.000000\n", + "25% 9.000000\n", + "50% 10.100000\n", + "75% 11.400000\n", + "max 130.000000" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:07:52)<< DONE (0.0s)\n", + "(2017-06-03 08:07:52)>> Joining!\n", + "(2017-06-03 08:08:36)<< DONE (44.0s)\n", + "(2017-06-03 08:08:36) DONE (100.0s)\n", + "(2017-06-03 08:08:36) lactate\n", + "(2017-06-03 08:08:36)>> Open Extract\n", + "(2017-06-03 08:08:37)<< DONE (1.0s)\n", + "(2017-06-03 08:08:37)>> Run Pipeline\n", + "(2017-06-03 08:08:52)<< DONE (15.0s)\n", + "(2017-06-03 08:08:52)>> Analyze...\n", + "((393608, 1), (177439, 1), 216244L, 33, '0.0962% records')\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th>lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>mmol/L</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>177364.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>8.286749</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2374.466306</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>1.200000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>1.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>2.900000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>999999.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label lactate\n", + "status known\n", + "variable_type qn\n", + "units mmol/L\n", + "count 177364.000000\n", + "mean 8.286749\n", + "std 2374.466306\n", + "min 0.000000\n", + "25% 1.200000\n", + "50% 1.800000\n", + "75% 2.900000\n", + "max 999999.000000" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-03 08:08:52)<< DONE (0.0s)\n", + "(2017-06-03 08:08:52)>> Joining!\n", + "(2017-06-03 08:09:35)<< DONE (43.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>heart rate</th>\n", + " <th>blood pressure systolic</th>\n", + " <th>blood pressure diastolic</th>\n", + " <th>blood pressure mean</th>\n", + " <th>respiratory rate</th>\n", + " <th>temperature body</th>\n", + " <th>oxygen saturation pulse oximetry</th>\n", + " <th>weight body</th>\n", + " <th>output urine</th>\n", + " <th>glasgow coma scale motor</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">normal saline</th>\n", + " <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n", + " <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n", + " <th colspan=\"2\" halign=\"left\">vasopressin</th>\n", + " <th>hemoglobin</th>\n", + " <th>lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>ord</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th>beats/min</th>\n", + " <th>mmHg</th>\n", + " <th>mmHg</th>\n", + " <th>mmHg</th>\n", + " <th>insp/min</th>\n", + " <th>degF</th>\n", + " <th>percent</th>\n", + " <th>kg</th>\n", + " <th>mL</th>\n", + " <th>no_units</th>\n", + " <th>...</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " <th>mcg/kg/min</th>\n", + " <th>mcg/min</th>\n", + " <th>units</th>\n", + " <th>units/min</th>\n", + " <th>g/dL</th>\n", + " <th>mmol/L</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"10\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 09:22:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>13.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:50:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>5.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:55:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>6.996487</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:57:00</th>\n", + " <td>122.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>14.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:00:00</th>\n", + " <td>118.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>22.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:01:00</th>\n", + " <td>NaN</td>\n", + " <td>192.0</td>\n", + " <td>100.0</td>\n", + " <td>122.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>499.999980</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:49:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>300.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:50:00</th>\n", + " <td>118.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>22.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>10 rows × 22 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label heart rate blood pressure systolic \\\n", + "status known known \n", + "variable_type qn qn \n", + "units beats/min mmHg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 122.0 NaN \n", + " 2117-09-11 13:00:00 118.0 NaN \n", + " 2117-09-11 13:01:00 NaN 192.0 \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 118.0 NaN \n", + "\n", + "label blood pressure diastolic blood pressure mean \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mmHg mmHg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 100.0 122.0 \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + "\n", + "label respiratory rate temperature body \\\n", + "status known known \n", + "variable_type qn qn \n", + "units insp/min degF \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 14.0 NaN \n", + " 2117-09-11 13:00:00 22.0 NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN 98.0 \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 22.0 NaN \n", + "\n", + "label oxygen saturation pulse oximetry weight body \\\n", + "status known known \n", + "variable_type qn qn \n", + "units percent kg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + "\n", + "label output urine glasgow coma scale motor ... \\\n", + "status known known ... \n", + "variable_type qn ord ... \n", + "units mL no_units ... \n", + "id datetime ... \n", + "100001 2117-09-11 09:22:00 NaN NaN ... \n", + " 2117-09-11 09:32:00 NaN NaN ... \n", + " 2117-09-11 12:50:00 NaN NaN ... \n", + " 2117-09-11 12:55:00 NaN NaN ... \n", + " 2117-09-11 12:57:00 NaN NaN ... \n", + " 2117-09-11 13:00:00 NaN NaN ... \n", + " 2117-09-11 13:01:00 NaN NaN ... \n", + " 2117-09-11 13:48:00 NaN NaN ... \n", + " 2117-09-11 13:49:00 300.0 NaN ... \n", + " 2117-09-11 13:50:00 NaN NaN ... \n", + "\n", + "label normal saline lactated ringers \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mL mL/hr mL mL/hr \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:50:00 NaN 5.000000 NaN NaN \n", + " 2117-09-11 12:55:00 NaN 6.996487 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:48:00 NaN 499.999980 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN NaN NaN \n", + "\n", + "label norepinephrine vasopressin \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mcg/kg/min mcg/min units units/min \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN NaN NaN \n", + "\n", + "label hemoglobin lactate \n", + "status known known \n", + "variable_type qn qn \n", + "units g/dL mmol/L \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 13.0 NaN \n", + " 2117-09-11 09:32:00 NaN 1.9 \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + "\n", + "[10 rows x 22 columns]" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "reload(logger)\n", + "simple_data = data_dict.get_panel_defintions(12) #12 is \"simple data\"\n", + "labels = simple_data.label.unique().tolist()\n", + "\n", + "df_final = None\n", + "for label in labels:\n", + " logger.log(label,new_level=True)\n", + " logger.log('Open Extract')\n", + " df_extract = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n", + "\n", + " logger.log('Run Pipeline')\n", + " all_pipeline.set_params(transform__add_level__level_val=label)\n", + " df = all_pipeline.transform(df_extract)\n", + " \n", + " logger.log('Analyze...')\n", + " print utils.data_loss(df_extract.set_index('id').value.to_frame(),df)\n", + " display(df.describe())\n", + "\n", + " logger.log('Joining!')\n", + "\n", + " if df_final is None: df_final = df\n", + " else: \n", + " df_final = df_final.join(df,how='outer')\n", + " del df\n", + " logger.end_log_level()\n", + "\n", + "df_final.head(10)" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>heart rate</th>\n", + " <th>blood pressure systolic</th>\n", + " <th>blood pressure diastolic</th>\n", + " <th>blood pressure mean</th>\n", + " <th>respiratory rate</th>\n", + " <th>temperature body</th>\n", + " <th>oxygen saturation pulse oximetry</th>\n", + " <th>weight body</th>\n", + " <th>output urine</th>\n", + " <th>glasgow coma scale motor</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">normal saline</th>\n", + " <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n", + " <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n", + " <th colspan=\"2\" halign=\"left\">vasopressin</th>\n", + " <th>hemoglobin</th>\n", + " <th>lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th colspan=\"2\" halign=\"left\">known</th>\n", + " <th>known</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " <th>ord</th>\n", + " <th>...</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th colspan=\"2\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th>beats/min</th>\n", + " <th>mmHg</th>\n", + " <th>mmHg</th>\n", + " <th>mmHg</th>\n", + " <th>insp/min</th>\n", + " <th>degF</th>\n", + " <th>percent</th>\n", + " <th>kg</th>\n", + " <th>mL</th>\n", + " <th>no_units</th>\n", + " <th>...</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " <th>mL</th>\n", + " <th>mL/hr</th>\n", + " <th>mcg/kg/min</th>\n", + " <th>mcg/min</th>\n", + " <th>units</th>\n", + " <th>units/min</th>\n", + " <th>g/dL</th>\n", + " <th>mmol/L</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"30\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 09:22:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>13.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:50:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>5.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:55:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>6.996487</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 12:57:00</th>\n", + " <td>122.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>14.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:00:00</th>\n", + " <td>118.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>22.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:01:00</th>\n", + " <td>NaN</td>\n", + " <td>192.0</td>\n", + " <td>100.0</td>\n", + " <td>122.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>499.999980</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:49:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>300.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 13:50:00</th>\n", + " <td>118.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>22.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 14:00:00</th>\n", + " <td>118.0</td>\n", + " <td>165.0</td>\n", + " <td>85.0</td>\n", + " <td>103.0</td>\n", + " <td>15.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>8.990600</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 15:00:00</th>\n", + " <td>110.0</td>\n", + " <td>119.0</td>\n", + " <td>64.0</td>\n", + " <td>76.0</td>\n", + " <td>15.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 15:48:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>999.999960</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 15:59:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>199.999998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <td>104.0</td>\n", + " <td>169.0</td>\n", + " <td>84.0</td>\n", + " <td>105.0</td>\n", + " <td>16.0</td>\n", + " <td>97.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:02:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:11:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>40.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:12:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>4.992476</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 17:00:00</th>\n", + " <td>101.0</td>\n", + " <td>110.0</td>\n", + " <td>62.0</td>\n", + " <td>75.0</td>\n", + " <td>15.0</td>\n", + " <td>NaN</td>\n", + " <td>97.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 18:00:00</th>\n", + " <td>112.0</td>\n", + " <td>170.0</td>\n", + " <td>86.0</td>\n", + " <td>106.0</td>\n", + " <td>16.0</td>\n", + " <td>NaN</td>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 18:34:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>400.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <td>108.0</td>\n", + " <td>179.0</td>\n", + " <td>88.0</td>\n", + " <td>110.0</td>\n", + " <td>NaN</td>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:31:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>11.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 20:00:00</th>\n", + " <td>116.0</td>\n", + " <td>183.0</td>\n", + " <td>91.0</td>\n", + " <td>114.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 21:00:00</th>\n", + " <td>117.0</td>\n", + " <td>189.0</td>\n", + " <td>98.0</td>\n", + " <td>121.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 21:12:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>3.396080</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 21:16:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>5.012718</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <td>124.0</td>\n", + " <td>180.0</td>\n", + " <td>88.0</td>\n", + " <td>110.0</td>\n", + " <td>NaN</td>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>200.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:10:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:25:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>500.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"30\" valign=\"top\">199999</th>\n", + " <th>2136-04-09 09:00:00</th>\n", + " <td>79.0</td>\n", + " <td>130.0</td>\n", + " <td>48.0</td>\n", + " <td>69.0</td>\n", + " <td>25.0</td>\n", + " <td>NaN</td>\n", + " <td>95.0</td>\n", + " <td>NaN</td>\n", + " <td>350.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 10:00:00</th>\n", + " <td>81.0</td>\n", + " <td>123.0</td>\n", + " <td>64.0</td>\n", + " <td>80.0</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 11:00:00</th>\n", + " <td>89.0</td>\n", + " <td>115.0</td>\n", + " <td>57.0</td>\n", + " <td>70.0</td>\n", + " <td>16.0</td>\n", + " <td>NaN</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 12:00:00</th>\n", + " <td>72.0</td>\n", + " <td>119.0</td>\n", + " <td>45.0</td>\n", + " <td>65.0</td>\n", + " <td>24.0</td>\n", + " <td>98.3</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 13:00:00</th>\n", + " <td>82.0</td>\n", + " <td>156.0</td>\n", + " <td>58.0</td>\n", + " <td>78.0</td>\n", + " <td>22.0</td>\n", + " <td>NaN</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 14:00:00</th>\n", + " <td>74.0</td>\n", + " <td>128.0</td>\n", + " <td>53.0</td>\n", + " <td>72.0</td>\n", + " <td>28.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 15:00:00</th>\n", + " <td>69.0</td>\n", + " <td>129.0</td>\n", + " <td>49.0</td>\n", + " <td>69.0</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 16:00:00</th>\n", + " <td>71.0</td>\n", + " <td>133.0</td>\n", + " <td>46.0</td>\n", + " <td>70.0</td>\n", + " <td>27.0</td>\n", + " <td>98.0</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>400.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 17:00:00</th>\n", + " <td>68.0</td>\n", + " <td>150.0</td>\n", + " <td>55.0</td>\n", + " <td>79.0</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 18:00:00</th>\n", + " <td>90.0</td>\n", + " <td>146.0</td>\n", + " <td>53.0</td>\n", + " <td>79.0</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 19:00:00</th>\n", + " <td>78.0</td>\n", + " <td>134.0</td>\n", + " <td>50.0</td>\n", + " <td>72.0</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 20:00:00</th>\n", + " <td>82.0</td>\n", + " <td>142.0</td>\n", + " <td>52.0</td>\n", + " <td>75.0</td>\n", + " <td>23.0</td>\n", + " <td>97.4</td>\n", + " <td>95.0</td>\n", + " <td>NaN</td>\n", + " <td>480.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 21:00:00</th>\n", + " <td>81.0</td>\n", + " <td>132.0</td>\n", + " <td>50.0</td>\n", + " <td>70.0</td>\n", + " <td>29.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 22:00:00</th>\n", + " <td>72.0</td>\n", + " <td>112.0</td>\n", + " <td>48.0</td>\n", + " <td>62.0</td>\n", + " <td>25.0</td>\n", + " <td>NaN</td>\n", + " <td>97.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 23:00:00</th>\n", + " <td>65.0</td>\n", + " <td>129.0</td>\n", + " <td>42.0</td>\n", + " <td>66.0</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>96.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 00:00:00</th>\n", + " <td>80.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>25.0</td>\n", + " <td>97.4</td>\n", + " <td>94.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 00:01:00</th>\n", + " <td>NaN</td>\n", + " <td>128.0</td>\n", + " <td>59.0</td>\n", + " <td>75.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 01:00:00</th>\n", + " <td>80.0</td>\n", + " <td>124.0</td>\n", + " <td>59.0</td>\n", + " <td>75.0</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>95.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 02:00:00</th>\n", + " <td>76.0</td>\n", + " <td>130.0</td>\n", + " <td>49.0</td>\n", + " <td>68.0</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>350.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 02:28:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>12.6</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 03:00:00</th>\n", + " <td>72.0</td>\n", + " <td>126.0</td>\n", + " <td>37.0</td>\n", + " <td>61.0</td>\n", + " <td>27.0</td>\n", + " <td>97.4</td>\n", + " <td>91.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 04:00:00</th>\n", + " <td>66.0</td>\n", + " <td>126.0</td>\n", + " <td>31.0</td>\n", + " <td>52.0</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>95.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 05:00:00</th>\n", + " <td>66.0</td>\n", + " <td>129.0</td>\n", + " <td>39.0</td>\n", + " <td>63.0</td>\n", + " <td>27.0</td>\n", + " <td>NaN</td>\n", + " <td>96.0</td>\n", + " <td>NaN</td>\n", + " <td>330.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 06:00:00</th>\n", + " <td>65.0</td>\n", + " <td>143.0</td>\n", + " <td>47.0</td>\n", + " <td>71.0</td>\n", + " <td>19.0</td>\n", + " <td>NaN</td>\n", + " <td>92.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 07:00:00</th>\n", + " <td>79.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>28.0</td>\n", + " <td>NaN</td>\n", + " <td>92.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 08:00:00</th>\n", + " <td>69.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>24.0</td>\n", + " <td>98.1</td>\n", + " <td>96.0</td>\n", + " <td>NaN</td>\n", + " <td>200.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 09:00:00</th>\n", + " <td>79.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>93.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 09:10:00</th>\n", + " <td>NaN</td>\n", + " <td>128.0</td>\n", + " <td>81.0</td>\n", + " <td>89.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 10:00:00</th>\n", + " <td>72.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>26.0</td>\n", + " <td>NaN</td>\n", + " <td>97.0</td>\n", + " <td>NaN</td>\n", + " <td>200.0</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 11:00:00</th>\n", + " <td>72.0</td>\n", + " <td>144.0</td>\n", + " <td>123.0</td>\n", + " <td>128.0</td>\n", + " <td>24.0</td>\n", + " <td>NaN</td>\n", + " <td>96.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>...</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>10071464 rows × 22 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label heart rate blood pressure systolic \\\n", + "status known known \n", + "variable_type qn qn \n", + "units beats/min mmHg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 122.0 NaN \n", + " 2117-09-11 13:00:00 118.0 NaN \n", + " 2117-09-11 13:01:00 NaN 192.0 \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 118.0 NaN \n", + " 2117-09-11 14:00:00 118.0 165.0 \n", + " 2117-09-11 15:00:00 110.0 119.0 \n", + " 2117-09-11 15:48:00 NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN \n", + " 2117-09-11 16:00:00 104.0 169.0 \n", + " 2117-09-11 16:02:00 NaN NaN \n", + " 2117-09-11 16:11:00 NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN \n", + " 2117-09-11 17:00:00 101.0 110.0 \n", + " 2117-09-11 18:00:00 112.0 170.0 \n", + " 2117-09-11 18:34:00 NaN NaN \n", + " 2117-09-11 19:00:00 108.0 179.0 \n", + " 2117-09-11 19:31:00 NaN NaN \n", + " 2117-09-11 20:00:00 116.0 183.0 \n", + " 2117-09-11 21:00:00 117.0 189.0 \n", + " 2117-09-11 21:12:00 NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN \n", + " 2117-09-11 22:00:00 124.0 180.0 \n", + " 2117-09-11 22:10:00 NaN NaN \n", + " 2117-09-11 22:25:00 NaN NaN \n", + "... ... ... \n", + "199999 2136-04-09 09:00:00 79.0 130.0 \n", + " 2136-04-09 10:00:00 81.0 123.0 \n", + " 2136-04-09 11:00:00 89.0 115.0 \n", + " 2136-04-09 12:00:00 72.0 119.0 \n", + " 2136-04-09 13:00:00 82.0 156.0 \n", + " 2136-04-09 14:00:00 74.0 128.0 \n", + " 2136-04-09 15:00:00 69.0 129.0 \n", + " 2136-04-09 16:00:00 71.0 133.0 \n", + " 2136-04-09 17:00:00 68.0 150.0 \n", + " 2136-04-09 18:00:00 90.0 146.0 \n", + " 2136-04-09 19:00:00 78.0 134.0 \n", + " 2136-04-09 20:00:00 82.0 142.0 \n", + " 2136-04-09 21:00:00 81.0 132.0 \n", + " 2136-04-09 22:00:00 72.0 112.0 \n", + " 2136-04-09 23:00:00 65.0 129.0 \n", + " 2136-04-10 00:00:00 80.0 NaN \n", + " 2136-04-10 00:01:00 NaN 128.0 \n", + " 2136-04-10 01:00:00 80.0 124.0 \n", + " 2136-04-10 02:00:00 76.0 130.0 \n", + " 2136-04-10 02:28:00 NaN NaN \n", + " 2136-04-10 03:00:00 72.0 126.0 \n", + " 2136-04-10 04:00:00 66.0 126.0 \n", + " 2136-04-10 05:00:00 66.0 129.0 \n", + " 2136-04-10 06:00:00 65.0 143.0 \n", + " 2136-04-10 07:00:00 79.0 NaN \n", + " 2136-04-10 08:00:00 69.0 NaN \n", + " 2136-04-10 09:00:00 79.0 NaN \n", + " 2136-04-10 09:10:00 NaN 128.0 \n", + " 2136-04-10 10:00:00 72.0 NaN \n", + " 2136-04-10 11:00:00 72.0 144.0 \n", + "\n", + "label blood pressure diastolic blood pressure mean \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mmHg mmHg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 100.0 122.0 \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + " 2117-09-11 14:00:00 85.0 103.0 \n", + " 2117-09-11 15:00:00 64.0 76.0 \n", + " 2117-09-11 15:48:00 NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN \n", + " 2117-09-11 16:00:00 84.0 105.0 \n", + " 2117-09-11 16:02:00 NaN NaN \n", + " 2117-09-11 16:11:00 NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN \n", + " 2117-09-11 17:00:00 62.0 75.0 \n", + " 2117-09-11 18:00:00 86.0 106.0 \n", + " 2117-09-11 18:34:00 NaN NaN \n", + " 2117-09-11 19:00:00 88.0 110.0 \n", + " 2117-09-11 19:31:00 NaN NaN \n", + " 2117-09-11 20:00:00 91.0 114.0 \n", + " 2117-09-11 21:00:00 98.0 121.0 \n", + " 2117-09-11 21:12:00 NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN \n", + " 2117-09-11 22:00:00 88.0 110.0 \n", + " 2117-09-11 22:10:00 NaN NaN \n", + " 2117-09-11 22:25:00 NaN NaN \n", + "... ... ... \n", + "199999 2136-04-09 09:00:00 48.0 69.0 \n", + " 2136-04-09 10:00:00 64.0 80.0 \n", + " 2136-04-09 11:00:00 57.0 70.0 \n", + " 2136-04-09 12:00:00 45.0 65.0 \n", + " 2136-04-09 13:00:00 58.0 78.0 \n", + " 2136-04-09 14:00:00 53.0 72.0 \n", + " 2136-04-09 15:00:00 49.0 69.0 \n", + " 2136-04-09 16:00:00 46.0 70.0 \n", + " 2136-04-09 17:00:00 55.0 79.0 \n", + " 2136-04-09 18:00:00 53.0 79.0 \n", + " 2136-04-09 19:00:00 50.0 72.0 \n", + " 2136-04-09 20:00:00 52.0 75.0 \n", + " 2136-04-09 21:00:00 50.0 70.0 \n", + " 2136-04-09 22:00:00 48.0 62.0 \n", + " 2136-04-09 23:00:00 42.0 66.0 \n", + " 2136-04-10 00:00:00 NaN NaN \n", + " 2136-04-10 00:01:00 59.0 75.0 \n", + " 2136-04-10 01:00:00 59.0 75.0 \n", + " 2136-04-10 02:00:00 49.0 68.0 \n", + " 2136-04-10 02:28:00 NaN NaN \n", + " 2136-04-10 03:00:00 37.0 61.0 \n", + " 2136-04-10 04:00:00 31.0 52.0 \n", + " 2136-04-10 05:00:00 39.0 63.0 \n", + " 2136-04-10 06:00:00 47.0 71.0 \n", + " 2136-04-10 07:00:00 NaN NaN \n", + " 2136-04-10 08:00:00 NaN NaN \n", + " 2136-04-10 09:00:00 NaN NaN \n", + " 2136-04-10 09:10:00 81.0 89.0 \n", + " 2136-04-10 10:00:00 NaN NaN \n", + " 2136-04-10 11:00:00 123.0 128.0 \n", + "\n", + "label respiratory rate temperature body \\\n", + "status known known \n", + "variable_type qn qn \n", + "units insp/min degF \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 14.0 NaN \n", + " 2117-09-11 13:00:00 22.0 NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN 98.0 \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 22.0 NaN \n", + " 2117-09-11 14:00:00 15.0 NaN \n", + " 2117-09-11 15:00:00 15.0 NaN \n", + " 2117-09-11 15:48:00 NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN \n", + " 2117-09-11 16:00:00 16.0 97.9 \n", + " 2117-09-11 16:02:00 NaN NaN \n", + " 2117-09-11 16:11:00 NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN \n", + " 2117-09-11 17:00:00 15.0 NaN \n", + " 2117-09-11 18:00:00 16.0 NaN \n", + " 2117-09-11 18:34:00 NaN NaN \n", + " 2117-09-11 19:00:00 NaN 99.5 \n", + " 2117-09-11 19:31:00 NaN NaN \n", + " 2117-09-11 20:00:00 NaN NaN \n", + " 2117-09-11 21:00:00 NaN NaN \n", + " 2117-09-11 21:12:00 NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN \n", + " 2117-09-11 22:00:00 NaN 100.0 \n", + " 2117-09-11 22:10:00 NaN NaN \n", + " 2117-09-11 22:25:00 NaN NaN \n", + "... ... ... \n", + "199999 2136-04-09 09:00:00 25.0 NaN \n", + " 2136-04-09 10:00:00 24.0 NaN \n", + " 2136-04-09 11:00:00 16.0 NaN \n", + " 2136-04-09 12:00:00 24.0 98.3 \n", + " 2136-04-09 13:00:00 22.0 NaN \n", + " 2136-04-09 14:00:00 28.0 NaN \n", + " 2136-04-09 15:00:00 26.0 NaN \n", + " 2136-04-09 16:00:00 27.0 98.0 \n", + " 2136-04-09 17:00:00 24.0 NaN \n", + " 2136-04-09 18:00:00 24.0 NaN \n", + " 2136-04-09 19:00:00 26.0 NaN \n", + " 2136-04-09 20:00:00 23.0 97.4 \n", + " 2136-04-09 21:00:00 29.0 NaN \n", + " 2136-04-09 22:00:00 25.0 NaN \n", + " 2136-04-09 23:00:00 24.0 NaN \n", + " 2136-04-10 00:00:00 25.0 97.4 \n", + " 2136-04-10 00:01:00 NaN NaN \n", + " 2136-04-10 01:00:00 26.0 NaN \n", + " 2136-04-10 02:00:00 26.0 NaN \n", + " 2136-04-10 02:28:00 NaN NaN \n", + " 2136-04-10 03:00:00 27.0 97.4 \n", + " 2136-04-10 04:00:00 26.0 NaN \n", + " 2136-04-10 05:00:00 27.0 NaN \n", + " 2136-04-10 06:00:00 19.0 NaN \n", + " 2136-04-10 07:00:00 28.0 NaN \n", + " 2136-04-10 08:00:00 24.0 98.1 \n", + " 2136-04-10 09:00:00 24.0 NaN \n", + " 2136-04-10 09:10:00 NaN NaN \n", + " 2136-04-10 10:00:00 26.0 NaN \n", + " 2136-04-10 11:00:00 24.0 NaN \n", + "\n", + "label oxygen saturation pulse oximetry weight body \\\n", + "status known known \n", + "variable_type qn qn \n", + "units percent kg \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + " 2117-09-11 14:00:00 NaN NaN \n", + " 2117-09-11 15:00:00 NaN NaN \n", + " 2117-09-11 15:48:00 NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN \n", + " 2117-09-11 16:00:00 NaN NaN \n", + " 2117-09-11 16:02:00 100.0 NaN \n", + " 2117-09-11 16:11:00 NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN \n", + " 2117-09-11 17:00:00 97.0 NaN \n", + " 2117-09-11 18:00:00 98.0 NaN \n", + " 2117-09-11 18:34:00 NaN NaN \n", + " 2117-09-11 19:00:00 NaN NaN \n", + " 2117-09-11 19:31:00 NaN NaN \n", + " 2117-09-11 20:00:00 97.0 NaN \n", + " 2117-09-11 21:00:00 NaN NaN \n", + " 2117-09-11 21:12:00 NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN \n", + " 2117-09-11 22:00:00 NaN NaN \n", + " 2117-09-11 22:10:00 97.0 NaN \n", + " 2117-09-11 22:25:00 NaN NaN \n", + "... ... ... \n", + "199999 2136-04-09 09:00:00 95.0 NaN \n", + " 2136-04-09 10:00:00 94.0 NaN \n", + " 2136-04-09 11:00:00 94.0 NaN \n", + " 2136-04-09 12:00:00 93.0 NaN \n", + " 2136-04-09 13:00:00 94.0 NaN \n", + " 2136-04-09 14:00:00 93.0 NaN \n", + " 2136-04-09 15:00:00 93.0 NaN \n", + " 2136-04-09 16:00:00 94.0 NaN \n", + " 2136-04-09 17:00:00 94.0 NaN \n", + " 2136-04-09 18:00:00 93.0 NaN \n", + " 2136-04-09 19:00:00 93.0 NaN \n", + " 2136-04-09 20:00:00 95.0 NaN \n", + " 2136-04-09 21:00:00 93.0 NaN \n", + " 2136-04-09 22:00:00 97.0 NaN \n", + " 2136-04-09 23:00:00 96.0 NaN \n", + " 2136-04-10 00:00:00 94.0 NaN \n", + " 2136-04-10 00:01:00 NaN NaN \n", + " 2136-04-10 01:00:00 95.0 NaN \n", + " 2136-04-10 02:00:00 93.0 NaN \n", + " 2136-04-10 02:28:00 NaN NaN \n", + " 2136-04-10 03:00:00 91.0 NaN \n", + " 2136-04-10 04:00:00 95.0 NaN \n", + " 2136-04-10 05:00:00 96.0 NaN \n", + " 2136-04-10 06:00:00 92.0 NaN \n", + " 2136-04-10 07:00:00 92.0 NaN \n", + " 2136-04-10 08:00:00 96.0 NaN \n", + " 2136-04-10 09:00:00 93.0 NaN \n", + " 2136-04-10 09:10:00 NaN NaN \n", + " 2136-04-10 10:00:00 97.0 NaN \n", + " 2136-04-10 11:00:00 96.0 NaN \n", + "\n", + "label output urine glasgow coma scale motor ... \\\n", + "status known known ... \n", + "variable_type qn ord ... \n", + "units mL no_units ... \n", + "id datetime ... \n", + "100001 2117-09-11 09:22:00 NaN NaN ... \n", + " 2117-09-11 09:32:00 NaN NaN ... \n", + " 2117-09-11 12:50:00 NaN NaN ... \n", + " 2117-09-11 12:55:00 NaN NaN ... \n", + " 2117-09-11 12:57:00 NaN NaN ... \n", + " 2117-09-11 13:00:00 NaN NaN ... \n", + " 2117-09-11 13:01:00 NaN NaN ... \n", + " 2117-09-11 13:48:00 NaN NaN ... \n", + " 2117-09-11 13:49:00 300.0 NaN ... \n", + " 2117-09-11 13:50:00 NaN NaN ... \n", + " 2117-09-11 14:00:00 NaN NaN ... \n", + " 2117-09-11 15:00:00 NaN NaN ... \n", + " 2117-09-11 15:48:00 NaN NaN ... \n", + " 2117-09-11 15:59:00 NaN NaN ... \n", + " 2117-09-11 16:00:00 NaN NaN ... \n", + " 2117-09-11 16:02:00 NaN NaN ... \n", + " 2117-09-11 16:11:00 NaN NaN ... \n", + " 2117-09-11 16:12:00 NaN NaN ... \n", + " 2117-09-11 17:00:00 NaN NaN ... \n", + " 2117-09-11 18:00:00 NaN NaN ... \n", + " 2117-09-11 18:34:00 400.0 NaN ... \n", + " 2117-09-11 19:00:00 NaN NaN ... \n", + " 2117-09-11 19:31:00 NaN NaN ... \n", + " 2117-09-11 20:00:00 NaN NaN ... \n", + " 2117-09-11 21:00:00 NaN NaN ... \n", + " 2117-09-11 21:12:00 NaN NaN ... \n", + " 2117-09-11 21:16:00 NaN NaN ... \n", + " 2117-09-11 22:00:00 200.0 NaN ... \n", + " 2117-09-11 22:10:00 NaN NaN ... \n", + " 2117-09-11 22:25:00 NaN NaN ... \n", + "... ... ... ... \n", + "199999 2136-04-09 09:00:00 350.0 NaN ... \n", + " 2136-04-09 10:00:00 NaN NaN ... \n", + " 2136-04-09 11:00:00 NaN NaN ... \n", + " 2136-04-09 12:00:00 NaN NaN ... \n", + " 2136-04-09 13:00:00 NaN NaN ... \n", + " 2136-04-09 14:00:00 NaN NaN ... \n", + " 2136-04-09 15:00:00 NaN NaN ... \n", + " 2136-04-09 16:00:00 400.0 NaN ... \n", + " 2136-04-09 17:00:00 NaN NaN ... \n", + " 2136-04-09 18:00:00 NaN NaN ... \n", + " 2136-04-09 19:00:00 NaN NaN ... \n", + " 2136-04-09 20:00:00 480.0 NaN ... \n", + " 2136-04-09 21:00:00 NaN NaN ... \n", + " 2136-04-09 22:00:00 NaN NaN ... \n", + " 2136-04-09 23:00:00 NaN NaN ... \n", + " 2136-04-10 00:00:00 NaN NaN ... \n", + " 2136-04-10 00:01:00 NaN NaN ... \n", + " 2136-04-10 01:00:00 NaN NaN ... \n", + " 2136-04-10 02:00:00 350.0 NaN ... \n", + " 2136-04-10 02:28:00 NaN NaN ... \n", + " 2136-04-10 03:00:00 NaN NaN ... \n", + " 2136-04-10 04:00:00 NaN NaN ... \n", + " 2136-04-10 05:00:00 330.0 NaN ... \n", + " 2136-04-10 06:00:00 NaN NaN ... \n", + " 2136-04-10 07:00:00 NaN NaN ... \n", + " 2136-04-10 08:00:00 200.0 NaN ... \n", + " 2136-04-10 09:00:00 NaN NaN ... \n", + " 2136-04-10 09:10:00 NaN NaN ... \n", + " 2136-04-10 10:00:00 200.0 NaN ... \n", + " 2136-04-10 11:00:00 NaN NaN ... \n", + "\n", + "label normal saline lactated ringers \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mL mL/hr mL mL/hr \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:50:00 NaN 5.000000 NaN NaN \n", + " 2117-09-11 12:55:00 NaN 6.996487 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:48:00 NaN 499.999980 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN NaN NaN \n", + " 2117-09-11 14:00:00 NaN 8.990600 NaN NaN \n", + " 2117-09-11 15:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 15:48:00 NaN 999.999960 NaN NaN \n", + " 2117-09-11 15:59:00 NaN 199.999998 NaN NaN \n", + " 2117-09-11 16:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:02:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:11:00 NaN 40.000000 NaN NaN \n", + " 2117-09-11 16:12:00 NaN 4.992476 NaN NaN \n", + " 2117-09-11 17:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 18:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 18:34:00 NaN NaN NaN NaN \n", + " 2117-09-11 19:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 19:31:00 NaN NaN NaN NaN \n", + " 2117-09-11 20:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 21:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 21:12:00 NaN 3.396080 NaN NaN \n", + " 2117-09-11 21:16:00 NaN 5.012718 NaN NaN \n", + " 2117-09-11 22:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 22:10:00 NaN NaN NaN NaN \n", + " 2117-09-11 22:25:00 500.0 NaN NaN NaN \n", + "... ... ... ... ... \n", + "199999 2136-04-09 09:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 10:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 11:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 12:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 13:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 14:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 15:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 16:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 17:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 18:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 19:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 20:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 21:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 22:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 23:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 00:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 00:01:00 NaN NaN NaN NaN \n", + " 2136-04-10 01:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 02:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 02:28:00 NaN NaN NaN NaN \n", + " 2136-04-10 03:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 04:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 05:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 06:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 07:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 08:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 09:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 09:10:00 NaN NaN NaN NaN \n", + " 2136-04-10 10:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 11:00:00 NaN NaN NaN NaN \n", + "\n", + "label norepinephrine vasopressin \\\n", + "status known known \n", + "variable_type qn qn \n", + "units mcg/kg/min mcg/min units units/min \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 NaN NaN NaN NaN \n", + " 2117-09-11 09:32:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:50:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN NaN NaN \n", + " 2117-09-11 14:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 15:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 15:48:00 NaN NaN NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:02:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:11:00 NaN NaN NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN NaN NaN \n", + " 2117-09-11 17:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 18:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 18:34:00 NaN NaN NaN NaN \n", + " 2117-09-11 19:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 19:31:00 NaN NaN NaN NaN \n", + " 2117-09-11 20:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 21:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 21:12:00 NaN NaN NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN NaN NaN \n", + " 2117-09-11 22:00:00 NaN NaN NaN NaN \n", + " 2117-09-11 22:10:00 NaN NaN NaN NaN \n", + " 2117-09-11 22:25:00 NaN NaN NaN NaN \n", + "... ... ... ... ... \n", + "199999 2136-04-09 09:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 10:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 11:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 12:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 13:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 14:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 15:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 16:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 17:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 18:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 19:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 20:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 21:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 22:00:00 NaN NaN NaN NaN \n", + " 2136-04-09 23:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 00:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 00:01:00 NaN NaN NaN NaN \n", + " 2136-04-10 01:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 02:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 02:28:00 NaN NaN NaN NaN \n", + " 2136-04-10 03:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 04:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 05:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 06:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 07:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 08:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 09:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 09:10:00 NaN NaN NaN NaN \n", + " 2136-04-10 10:00:00 NaN NaN NaN NaN \n", + " 2136-04-10 11:00:00 NaN NaN NaN NaN \n", + "\n", + "label hemoglobin lactate \n", + "status known known \n", + "variable_type qn qn \n", + "units g/dL mmol/L \n", + "id datetime \n", + "100001 2117-09-11 09:22:00 13.0 NaN \n", + " 2117-09-11 09:32:00 NaN 1.9 \n", + " 2117-09-11 12:50:00 NaN NaN \n", + " 2117-09-11 12:55:00 NaN NaN \n", + " 2117-09-11 12:57:00 NaN NaN \n", + " 2117-09-11 13:00:00 NaN NaN \n", + " 2117-09-11 13:01:00 NaN NaN \n", + " 2117-09-11 13:48:00 NaN NaN \n", + " 2117-09-11 13:49:00 NaN NaN \n", + " 2117-09-11 13:50:00 NaN NaN \n", + " 2117-09-11 14:00:00 NaN NaN \n", + " 2117-09-11 15:00:00 NaN NaN \n", + " 2117-09-11 15:48:00 NaN NaN \n", + " 2117-09-11 15:59:00 NaN NaN \n", + " 2117-09-11 16:00:00 NaN NaN \n", + " 2117-09-11 16:02:00 NaN NaN \n", + " 2117-09-11 16:11:00 NaN NaN \n", + " 2117-09-11 16:12:00 NaN NaN \n", + " 2117-09-11 17:00:00 NaN NaN \n", + " 2117-09-11 18:00:00 NaN NaN \n", + " 2117-09-11 18:34:00 NaN NaN \n", + " 2117-09-11 19:00:00 NaN NaN \n", + " 2117-09-11 19:31:00 11.0 NaN \n", + " 2117-09-11 20:00:00 NaN NaN \n", + " 2117-09-11 21:00:00 NaN NaN \n", + " 2117-09-11 21:12:00 NaN NaN \n", + " 2117-09-11 21:16:00 NaN NaN \n", + " 2117-09-11 22:00:00 NaN NaN \n", + " 2117-09-11 22:10:00 NaN NaN \n", + " 2117-09-11 22:25:00 NaN NaN \n", + "... ... ... \n", + "199999 2136-04-09 09:00:00 NaN NaN \n", + " 2136-04-09 10:00:00 NaN NaN \n", + " 2136-04-09 11:00:00 NaN NaN \n", + " 2136-04-09 12:00:00 NaN NaN \n", + " 2136-04-09 13:00:00 NaN NaN \n", + " 2136-04-09 14:00:00 NaN NaN \n", + " 2136-04-09 15:00:00 NaN NaN \n", + " 2136-04-09 16:00:00 NaN NaN \n", + " 2136-04-09 17:00:00 NaN NaN \n", + " 2136-04-09 18:00:00 NaN NaN \n", + " 2136-04-09 19:00:00 NaN NaN \n", + " 2136-04-09 20:00:00 NaN NaN \n", + " 2136-04-09 21:00:00 NaN NaN \n", + " 2136-04-09 22:00:00 NaN NaN \n", + " 2136-04-09 23:00:00 NaN NaN \n", + " 2136-04-10 00:00:00 NaN NaN \n", + " 2136-04-10 00:01:00 NaN NaN \n", + " 2136-04-10 01:00:00 NaN NaN \n", + " 2136-04-10 02:00:00 NaN NaN \n", + " 2136-04-10 02:28:00 12.6 NaN \n", + " 2136-04-10 03:00:00 NaN NaN \n", + " 2136-04-10 04:00:00 NaN NaN \n", + " 2136-04-10 05:00:00 NaN NaN \n", + " 2136-04-10 06:00:00 NaN NaN \n", + " 2136-04-10 07:00:00 NaN NaN \n", + " 2136-04-10 08:00:00 NaN NaN \n", + " 2136-04-10 09:00:00 NaN NaN \n", + " 2136-04-10 09:10:00 NaN NaN \n", + " 2136-04-10 10:00:00 NaN NaN \n", + " 2136-04-10 11:00:00 NaN NaN \n", + "\n", + "[10071464 rows x 22 columns]" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "utils.save_df(df_final,hdf5_fname,'cleaned/test1')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Prepare for ML\n", + "\n", + "\n", + "1. All categories to numeric representations\n", + "2. Segment, add to index\n", + "3. Transform into features (FeatureUnion)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "intro_pipeline = Pipeline([\n", + " ('transform',mimic_transform),\n", + " ('format',standard_pipeline),\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"8\" halign=\"left\">lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " <th colspan=\"4\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th colspan=\"3\" halign=\"left\">nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">mmol/L</th>\n", + " <th>no_units</th>\n", + " <th colspan=\"3\" halign=\"left\">no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>50813</th>\n", + " <th>225668</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>225668</th>\n", + " <th>50813(mmol/L)</th>\n", + " <th>818(mmol/L)</th>\n", + " <th>1531(mmol/L)</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>100001</th>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100003</th>\n", + " <th>2150-04-17 19:12:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-08 10:58:00</th>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-03-31 00:44:00</th>\n", + " <td>3.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-02 14:10:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label lactate \\\n", + "status known unknown \n", + "variable_type qn qn nom \n", + "units mmol/L no_units no_units \n", + "description 50813 225668 818 1531 225668 50813(mmol/L) \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 1.9 NaN NaN NaN NaN NaN \n", + "100003 2150-04-17 19:12:00 1.1 1.1 NaN NaN NaN NaN \n", + "100006 2108-04-08 10:58:00 4.5 NaN 4.5 NaN NaN NaN \n", + "100007 2145-03-31 00:44:00 3.1 NaN NaN NaN NaN NaN \n", + " 2145-04-02 14:10:00 1.9 NaN NaN NaN NaN NaN \n", + "\n", + "label \n", + "status \n", + "variable_type \n", + "units \n", + "description 818(mmol/L) 1531(mmol/L) \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 NaN NaN \n", + "100003 2150-04-17 19:12:00 NaN NaN \n", + "100006 2108-04-08 10:58:00 NaN NaN \n", + "100007 2145-03-31 00:44:00 NaN NaN \n", + " 2145-04-02 14:10:00 NaN NaN " + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "label = 'lactate'\n", + "df_extract = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n", + "df_cleaned = intro_pipeline.transform(df_extract)\n", + "df_cleaned.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"8\" halign=\"left\">lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " <th colspan=\"4\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th colspan=\"3\" halign=\"left\">nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">mmol/L</th>\n", + " <th>no_units</th>\n", + " <th colspan=\"3\" halign=\"left\">no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>50813</th>\n", + " <th>225668</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>225668</th>\n", + " <th>50813(mmol/L)</th>\n", + " <th>818(mmol/L)</th>\n", + " <th>1531(mmol/L)</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>176767.000000</td>\n", + " <td>69402.000000</td>\n", + " <td>72916.000000</td>\n", + " <td>63134.000000</td>\n", + " <td>14.000000</td>\n", + " <td>57</td>\n", + " <td>57</td>\n", + " <td>23</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34</td>\n", + " <td>14</td>\n", + " <td>8</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>ERROR</td>\n", + " <td>no data</td>\n", + " <td>no data</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>18</td>\n", + " <td>37</td>\n", + " <td>9</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>2.635120</td>\n", + " <td>16.943607</td>\n", + " <td>2.849300</td>\n", + " <td>2.780338</td>\n", + " <td>52.835714</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2.590268</td>\n", + " <td>3795.881233</td>\n", + " <td>3.152031</td>\n", + " <td>3.045527</td>\n", + " <td>82.567153</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>0.050000</td>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>1.200000</td>\n", + " <td>1.200000</td>\n", + " <td>1.200000</td>\n", + " <td>1.200000</td>\n", + " <td>1.175000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>1.800000</td>\n", + " <td>1.800000</td>\n", + " <td>1.800000</td>\n", + " <td>1.800000</td>\n", + " <td>3.400000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>2.900000</td>\n", + " <td>2.900000</td>\n", + " <td>3.100000</td>\n", + " <td>3.000000</td>\n", + " <td>115.400000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>36.000000</td>\n", + " <td>999999.000000</td>\n", + " <td>153.000000</td>\n", + " <td>153.000000</td>\n", + " <td>203.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label lactate \\\n", + "status known \n", + "variable_type qn \n", + "units mmol/L \n", + "description 50813 225668 818 1531 \n", + "count 176767.000000 69402.000000 72916.000000 63134.000000 \n", + "unique NaN NaN NaN NaN \n", + "top NaN NaN NaN NaN \n", + "freq NaN NaN NaN NaN \n", + "mean 2.635120 16.943607 2.849300 2.780338 \n", + "std 2.590268 3795.881233 3.152031 3.045527 \n", + "min 0.000000 0.050000 0.000000 0.000000 \n", + "25% 1.200000 1.200000 1.200000 1.200000 \n", + "50% 1.800000 1.800000 1.800000 1.800000 \n", + "75% 2.900000 2.900000 3.100000 3.000000 \n", + "max 36.000000 999999.000000 153.000000 153.000000 \n", + "\n", + "label \n", + "status unknown \n", + "variable_type qn nom \n", + "units no_units no_units \n", + "description 225668 50813(mmol/L) 818(mmol/L) 1531(mmol/L) \n", + "count 14.000000 57 57 23 \n", + "unique NaN 34 14 8 \n", + "top NaN ERROR no data no data \n", + "freq NaN 18 37 9 \n", + "mean 52.835714 NaN NaN NaN \n", + "std 82.567153 NaN NaN NaN \n", + "min 0.000000 NaN NaN NaN \n", + "25% 1.175000 NaN NaN NaN \n", + "50% 3.400000 NaN NaN NaN \n", + "75% 115.400000 NaN NaN NaN \n", + "max 203.000000 NaN NaN NaN " + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_cleaned.describe(include='all')" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"21\" halign=\"left\">lactate</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " <th colspan=\"17\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " <th>qn</th>\n", + " <th colspan=\"16\" halign=\"left\">nom</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">mmol/L</th>\n", + " <th>no_units</th>\n", + " <th colspan=\"16\" halign=\"left\">no_units</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>50813</th>\n", + " <th>225668</th>\n", + " <th>818</th>\n", + " <th>1531</th>\n", + " <th>225668</th>\n", + " <th>50813(mmol/L)_.</th>\n", + " <th>50813(mmol/L)_5,0</th>\n", + " <th>50813(mmol/L)_>30</th>\n", + " <th>50813(mmol/L)_>30.0</th>\n", + " <th>50813(mmol/L)_CLOTTED</th>\n", + " <th>...</th>\n", + " <th>818(mmol/L)_VOIDED</th>\n", + " <th>818(mmol/L)_no data</th>\n", + " <th>1531(mmol/L)_.</th>\n", + " <th>1531(mmol/L)_5,0</th>\n", + " <th>1531(mmol/L)_>30</th>\n", + " <th>1531(mmol/L)_>30.0</th>\n", + " <th>1531(mmol/L)_CLOTTED</th>\n", + " <th>1531(mmol/L)_ERROR</th>\n", + " <th>1531(mmol/L)_VOIDED</th>\n", + " <th>1531(mmol/L)_no data</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>100001</th>\n", + " <th>2117-09-11 09:32:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100003</th>\n", + " <th>2150-04-17 19:12:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-08 10:58:00</th>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>4.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-03-31 00:44:00</th>\n", + " <td>3.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-02 14:10:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100009</th>\n", + " <th>2162-05-17 13:19:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2162-05-17 17:14:00</th>\n", + " <td>1.5</td>\n", + " <td>1.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">100010</th>\n", + " <th>2109-12-10 10:25:00</th>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 12:11:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:05:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-10 13:58:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100011</th>\n", + " <th>2177-08-29 04:44:00</th>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-08-29 06:55:00</th>\n", + " <td>2.3</td>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100012</th>\n", + " <th>2177-03-14 07:38:00</th>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-14 11:42:00</th>\n", + " <td>2.5</td>\n", + " <td>2.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 08:05:00</th>\n", + " <td>2.1</td>\n", + " <td>2.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 14:01:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-03-15 21:42:00</th>\n", + " <td>1.8</td>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100016</th>\n", + " <th>2188-05-24 12:00:00</th>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100017</th>\n", + " <th>2103-03-11 05:10:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">100018</th>\n", + " <th>2176-08-29 15:29:00</th>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 09:23:00</th>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 10:19:00</th>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 11:29:00</th>\n", + " <td>0.9</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2176-08-30 12:40:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100020</th>\n", + " <th>2142-11-30 21:54:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2142-12-03 00:17:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100024</th>\n", + " <th>2170-09-19 10:25:00</th>\n", + " <td>1.4</td>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-19 16:33:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2170-09-20 02:04:00</th>\n", + " <td>3.2</td>\n", + " <td>3.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199976</th>\n", + " <th>2182-02-14 11:15:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-16 03:57:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-19 03:59:00</th>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>0.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-20 03:31:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-21 04:55:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199979</th>\n", + " <th>2182-02-06 09:17:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2182-02-06 14:16:00</th>\n", + " <td>3.8</td>\n", + " <td>3.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">199981</th>\n", + " <th>2110-09-24 16:34:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-24 20:09:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2110-09-25 06:10:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>199987</th>\n", + " <th>2175-05-19 16:30:00</th>\n", + " <td>2.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">199988</th>\n", + " <th>2169-01-24 12:48:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 01:35:00</th>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>1.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 11:18:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 16:43:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-07 22:35:00</th>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2169-02-10 05:33:00</th>\n", + " <td>1.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199993</th>\n", + " <th>2161-11-12 23:14:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-11-13 03:46:00</th>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>0.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"4\" valign=\"top\">199994</th>\n", + " <th>2188-07-07 21:23:00</th>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 03:09:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 04:13:00</th>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>0.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2188-07-08 06:20:00</th>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>0.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"5\" valign=\"top\">199998</th>\n", + " <th>2119-02-20 10:52:00</th>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>1.1</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 12:36:00</th>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:33:00</th>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 13:59:00</th>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>2.6</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 20:43:00</th>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>1.3</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">199999</th>\n", + " <th>2136-04-04 20:55:00</th>\n", + " <td>1.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 15:29:00</th>\n", + " <td>1.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>...</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " <td>0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>177450 rows × 29 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label lactate \\\n", + "status known unknown \n", + "variable_type qn qn nom \n", + "units mmol/L no_units no_units \n", + "description 50813 225668 818 1531 225668 50813(mmol/L)_. \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 1.9 NaN NaN NaN NaN 0 \n", + "100003 2150-04-17 19:12:00 1.1 1.1 NaN NaN NaN 0 \n", + "100006 2108-04-08 10:58:00 4.5 NaN 4.5 NaN NaN 0 \n", + "100007 2145-03-31 00:44:00 3.1 NaN NaN NaN NaN 0 \n", + " 2145-04-02 14:10:00 1.9 NaN NaN NaN NaN 0 \n", + "100009 2162-05-17 13:19:00 1.1 1.1 NaN NaN NaN 0 \n", + " 2162-05-17 17:14:00 1.5 1.5 NaN NaN NaN 0 \n", + "100010 2109-12-10 10:25:00 0.6 NaN NaN NaN NaN 0 \n", + " 2109-12-10 12:11:00 0.9 NaN NaN NaN NaN 0 \n", + " 2109-12-10 13:05:00 1.0 NaN NaN NaN NaN 0 \n", + " 2109-12-10 13:58:00 0.8 NaN NaN NaN NaN 0 \n", + "100011 2177-08-29 04:44:00 3.8 NaN NaN NaN NaN 0 \n", + " 2177-08-29 06:55:00 2.3 2.3 NaN NaN NaN 0 \n", + "100012 2177-03-14 07:38:00 2.3 NaN NaN NaN NaN 0 \n", + " 2177-03-14 11:42:00 2.5 2.5 NaN NaN NaN 0 \n", + " 2177-03-15 08:05:00 2.1 2.1 NaN NaN NaN 0 \n", + " 2177-03-15 14:01:00 2.6 2.6 NaN NaN NaN 0 \n", + " 2177-03-15 21:42:00 1.8 1.8 NaN NaN NaN 0 \n", + "100016 2188-05-24 12:00:00 2.0 NaN NaN NaN NaN 0 \n", + "100017 2103-03-11 05:10:00 1.1 NaN 1.1 NaN NaN 0 \n", + "100018 2176-08-29 15:29:00 1.3 NaN NaN NaN NaN 0 \n", + " 2176-08-30 09:23:00 0.9 0.9 NaN NaN NaN 0 \n", + " 2176-08-30 10:19:00 1.0 1.0 NaN NaN NaN 0 \n", + " 2176-08-30 11:29:00 0.9 0.9 NaN NaN NaN 0 \n", + " 2176-08-30 12:40:00 1.1 1.1 NaN NaN NaN 0 \n", + "100020 2142-11-30 21:54:00 1.1 NaN NaN NaN NaN 0 \n", + " 2142-12-03 00:17:00 1.0 NaN NaN NaN NaN 0 \n", + "100024 2170-09-19 10:25:00 1.4 1.4 NaN NaN NaN 0 \n", + " 2170-09-19 16:33:00 2.6 2.6 NaN NaN NaN 0 \n", + " 2170-09-20 02:04:00 3.2 3.2 NaN NaN NaN 0 \n", + "... ... ... ... ... ... ... \n", + "199976 2182-02-14 11:15:00 0.8 NaN 0.8 NaN NaN 0 \n", + " 2182-02-16 03:57:00 0.8 NaN 0.8 NaN NaN 0 \n", + " 2182-02-19 03:59:00 0.8 NaN 0.8 NaN NaN 0 \n", + " 2182-02-20 03:31:00 0.7 NaN 0.7 NaN NaN 0 \n", + " 2182-02-21 04:55:00 0.9 NaN 0.9 NaN NaN 0 \n", + "199979 2182-02-06 09:17:00 1.0 NaN NaN NaN NaN 0 \n", + " 2182-02-06 14:16:00 3.8 3.8 NaN NaN NaN 0 \n", + "199981 2110-09-24 16:34:00 1.1 NaN 1.1 1.1 NaN 0 \n", + " 2110-09-24 20:09:00 1.0 NaN 1.0 1.0 NaN 0 \n", + " 2110-09-25 06:10:00 1.0 NaN 1.0 1.0 NaN 0 \n", + "199987 2175-05-19 16:30:00 2.3 NaN NaN NaN NaN 0 \n", + "199988 2169-01-24 12:48:00 1.0 NaN NaN NaN NaN 0 \n", + " 2169-02-07 01:35:00 1.6 NaN 1.6 NaN NaN 0 \n", + " 2169-02-07 11:18:00 1.0 NaN 1.0 NaN NaN 0 \n", + " 2169-02-07 16:43:00 1.0 NaN 1.0 NaN NaN 0 \n", + " 2169-02-07 22:35:00 1.1 NaN 1.1 NaN NaN 0 \n", + " 2169-02-10 05:33:00 1.4 NaN NaN NaN NaN 0 \n", + "199993 2161-11-12 23:14:00 0.9 NaN 0.9 NaN NaN 0 \n", + " 2161-11-13 03:46:00 0.9 NaN 0.9 NaN NaN 0 \n", + "199994 2188-07-07 21:23:00 1.0 NaN 1.0 NaN NaN 0 \n", + " 2188-07-08 03:09:00 0.7 NaN 0.7 NaN NaN 0 \n", + " 2188-07-08 04:13:00 0.6 NaN 0.6 NaN NaN 0 \n", + " 2188-07-08 06:20:00 0.7 NaN 0.7 NaN NaN 0 \n", + "199998 2119-02-20 10:52:00 1.1 1.1 1.1 1.1 NaN 0 \n", + " 2119-02-20 12:36:00 1.9 1.9 1.9 1.9 NaN 0 \n", + " 2119-02-20 13:33:00 2.0 2.0 2.0 2.0 NaN 0 \n", + " 2119-02-20 13:59:00 2.6 2.6 2.6 2.6 NaN 0 \n", + " 2119-02-20 20:43:00 1.3 1.3 1.3 1.3 NaN 0 \n", + "199999 2136-04-04 20:55:00 1.9 NaN NaN NaN NaN 0 \n", + " 2136-04-06 15:29:00 1.8 NaN NaN NaN NaN 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 50813(mmol/L)_5,0 50813(mmol/L)_>30 \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 50813(mmol/L)_>30.0 50813(mmol/L)_CLOTTED \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label ... \\\n", + "status ... \n", + "variable_type ... \n", + "units ... \n", + "description ... 818(mmol/L)_VOIDED \n", + "id datetime ... \n", + "100001 2117-09-11 09:32:00 ... 0 \n", + "100003 2150-04-17 19:12:00 ... 0 \n", + "100006 2108-04-08 10:58:00 ... 0 \n", + "100007 2145-03-31 00:44:00 ... 0 \n", + " 2145-04-02 14:10:00 ... 0 \n", + "100009 2162-05-17 13:19:00 ... 0 \n", + " 2162-05-17 17:14:00 ... 0 \n", + "100010 2109-12-10 10:25:00 ... 0 \n", + " 2109-12-10 12:11:00 ... 0 \n", + " 2109-12-10 13:05:00 ... 0 \n", + " 2109-12-10 13:58:00 ... 0 \n", + "100011 2177-08-29 04:44:00 ... 0 \n", + " 2177-08-29 06:55:00 ... 0 \n", + "100012 2177-03-14 07:38:00 ... 0 \n", + " 2177-03-14 11:42:00 ... 0 \n", + " 2177-03-15 08:05:00 ... 0 \n", + " 2177-03-15 14:01:00 ... 0 \n", + " 2177-03-15 21:42:00 ... 0 \n", + "100016 2188-05-24 12:00:00 ... 0 \n", + "100017 2103-03-11 05:10:00 ... 0 \n", + "100018 2176-08-29 15:29:00 ... 0 \n", + " 2176-08-30 09:23:00 ... 0 \n", + " 2176-08-30 10:19:00 ... 0 \n", + " 2176-08-30 11:29:00 ... 0 \n", + " 2176-08-30 12:40:00 ... 0 \n", + "100020 2142-11-30 21:54:00 ... 0 \n", + " 2142-12-03 00:17:00 ... 0 \n", + "100024 2170-09-19 10:25:00 ... 0 \n", + " 2170-09-19 16:33:00 ... 0 \n", + " 2170-09-20 02:04:00 ... 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 ... 0 \n", + " 2182-02-16 03:57:00 ... 0 \n", + " 2182-02-19 03:59:00 ... 0 \n", + " 2182-02-20 03:31:00 ... 0 \n", + " 2182-02-21 04:55:00 ... 0 \n", + "199979 2182-02-06 09:17:00 ... 0 \n", + " 2182-02-06 14:16:00 ... 0 \n", + "199981 2110-09-24 16:34:00 ... 0 \n", + " 2110-09-24 20:09:00 ... 0 \n", + " 2110-09-25 06:10:00 ... 0 \n", + "199987 2175-05-19 16:30:00 ... 0 \n", + "199988 2169-01-24 12:48:00 ... 0 \n", + " 2169-02-07 01:35:00 ... 0 \n", + " 2169-02-07 11:18:00 ... 0 \n", + " 2169-02-07 16:43:00 ... 0 \n", + " 2169-02-07 22:35:00 ... 0 \n", + " 2169-02-10 05:33:00 ... 0 \n", + "199993 2161-11-12 23:14:00 ... 0 \n", + " 2161-11-13 03:46:00 ... 0 \n", + "199994 2188-07-07 21:23:00 ... 0 \n", + " 2188-07-08 03:09:00 ... 0 \n", + " 2188-07-08 04:13:00 ... 0 \n", + " 2188-07-08 06:20:00 ... 0 \n", + "199998 2119-02-20 10:52:00 ... 0 \n", + " 2119-02-20 12:36:00 ... 0 \n", + " 2119-02-20 13:33:00 ... 0 \n", + " 2119-02-20 13:59:00 ... 0 \n", + " 2119-02-20 20:43:00 ... 0 \n", + "199999 2136-04-04 20:55:00 ... 0 \n", + " 2136-04-06 15:29:00 ... 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 818(mmol/L)_no data 1531(mmol/L)_. \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 1531(mmol/L)_5,0 1531(mmol/L)_>30 \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 1531(mmol/L)_>30.0 1531(mmol/L)_CLOTTED \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label \\\n", + "status \n", + "variable_type \n", + "units \n", + "description 1531(mmol/L)_ERROR 1531(mmol/L)_VOIDED \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 0 \n", + "100003 2150-04-17 19:12:00 0 0 \n", + "100006 2108-04-08 10:58:00 0 0 \n", + "100007 2145-03-31 00:44:00 0 0 \n", + " 2145-04-02 14:10:00 0 0 \n", + "100009 2162-05-17 13:19:00 0 0 \n", + " 2162-05-17 17:14:00 0 0 \n", + "100010 2109-12-10 10:25:00 0 0 \n", + " 2109-12-10 12:11:00 0 0 \n", + " 2109-12-10 13:05:00 0 0 \n", + " 2109-12-10 13:58:00 0 0 \n", + "100011 2177-08-29 04:44:00 0 0 \n", + " 2177-08-29 06:55:00 0 0 \n", + "100012 2177-03-14 07:38:00 0 0 \n", + " 2177-03-14 11:42:00 0 0 \n", + " 2177-03-15 08:05:00 0 0 \n", + " 2177-03-15 14:01:00 0 0 \n", + " 2177-03-15 21:42:00 0 0 \n", + "100016 2188-05-24 12:00:00 0 0 \n", + "100017 2103-03-11 05:10:00 0 0 \n", + "100018 2176-08-29 15:29:00 0 0 \n", + " 2176-08-30 09:23:00 0 0 \n", + " 2176-08-30 10:19:00 0 0 \n", + " 2176-08-30 11:29:00 0 0 \n", + " 2176-08-30 12:40:00 0 0 \n", + "100020 2142-11-30 21:54:00 0 0 \n", + " 2142-12-03 00:17:00 0 0 \n", + "100024 2170-09-19 10:25:00 0 0 \n", + " 2170-09-19 16:33:00 0 0 \n", + " 2170-09-20 02:04:00 0 0 \n", + "... ... ... \n", + "199976 2182-02-14 11:15:00 0 0 \n", + " 2182-02-16 03:57:00 0 0 \n", + " 2182-02-19 03:59:00 0 0 \n", + " 2182-02-20 03:31:00 0 0 \n", + " 2182-02-21 04:55:00 0 0 \n", + "199979 2182-02-06 09:17:00 0 0 \n", + " 2182-02-06 14:16:00 0 0 \n", + "199981 2110-09-24 16:34:00 0 0 \n", + " 2110-09-24 20:09:00 0 0 \n", + " 2110-09-25 06:10:00 0 0 \n", + "199987 2175-05-19 16:30:00 0 0 \n", + "199988 2169-01-24 12:48:00 0 0 \n", + " 2169-02-07 01:35:00 0 0 \n", + " 2169-02-07 11:18:00 0 0 \n", + " 2169-02-07 16:43:00 0 0 \n", + " 2169-02-07 22:35:00 0 0 \n", + " 2169-02-10 05:33:00 0 0 \n", + "199993 2161-11-12 23:14:00 0 0 \n", + " 2161-11-13 03:46:00 0 0 \n", + "199994 2188-07-07 21:23:00 0 0 \n", + " 2188-07-08 03:09:00 0 0 \n", + " 2188-07-08 04:13:00 0 0 \n", + " 2188-07-08 06:20:00 0 0 \n", + "199998 2119-02-20 10:52:00 0 0 \n", + " 2119-02-20 12:36:00 0 0 \n", + " 2119-02-20 13:33:00 0 0 \n", + " 2119-02-20 13:59:00 0 0 \n", + " 2119-02-20 20:43:00 0 0 \n", + "199999 2136-04-04 20:55:00 0 0 \n", + " 2136-04-06 15:29:00 0 0 \n", + "\n", + "label \n", + "status \n", + "variable_type \n", + "units \n", + "description 1531(mmol/L)_no data \n", + "id datetime \n", + "100001 2117-09-11 09:32:00 0 \n", + "100003 2150-04-17 19:12:00 0 \n", + "100006 2108-04-08 10:58:00 0 \n", + "100007 2145-03-31 00:44:00 0 \n", + " 2145-04-02 14:10:00 0 \n", + "100009 2162-05-17 13:19:00 0 \n", + " 2162-05-17 17:14:00 0 \n", + "100010 2109-12-10 10:25:00 0 \n", + " 2109-12-10 12:11:00 0 \n", + " 2109-12-10 13:05:00 0 \n", + " 2109-12-10 13:58:00 0 \n", + "100011 2177-08-29 04:44:00 0 \n", + " 2177-08-29 06:55:00 0 \n", + "100012 2177-03-14 07:38:00 0 \n", + " 2177-03-14 11:42:00 0 \n", + " 2177-03-15 08:05:00 0 \n", + " 2177-03-15 14:01:00 0 \n", + " 2177-03-15 21:42:00 0 \n", + "100016 2188-05-24 12:00:00 0 \n", + "100017 2103-03-11 05:10:00 0 \n", + "100018 2176-08-29 15:29:00 0 \n", + " 2176-08-30 09:23:00 0 \n", + " 2176-08-30 10:19:00 0 \n", + " 2176-08-30 11:29:00 0 \n", + " 2176-08-30 12:40:00 0 \n", + "100020 2142-11-30 21:54:00 0 \n", + " 2142-12-03 00:17:00 0 \n", + "100024 2170-09-19 10:25:00 0 \n", + " 2170-09-19 16:33:00 0 \n", + " 2170-09-20 02:04:00 0 \n", + "... ... \n", + "199976 2182-02-14 11:15:00 0 \n", + " 2182-02-16 03:57:00 0 \n", + " 2182-02-19 03:59:00 0 \n", + " 2182-02-20 03:31:00 0 \n", + " 2182-02-21 04:55:00 0 \n", + "199979 2182-02-06 09:17:00 0 \n", + " 2182-02-06 14:16:00 0 \n", + "199981 2110-09-24 16:34:00 0 \n", + " 2110-09-24 20:09:00 0 \n", + " 2110-09-25 06:10:00 0 \n", + "199987 2175-05-19 16:30:00 0 \n", + "199988 2169-01-24 12:48:00 0 \n", + " 2169-02-07 01:35:00 0 \n", + " 2169-02-07 11:18:00 0 \n", + " 2169-02-07 16:43:00 0 \n", + " 2169-02-07 22:35:00 0 \n", + " 2169-02-10 05:33:00 0 \n", + "199993 2161-11-12 23:14:00 0 \n", + " 2161-11-13 03:46:00 0 \n", + "199994 2188-07-07 21:23:00 0 \n", + " 2188-07-08 03:09:00 0 \n", + " 2188-07-08 04:13:00 0 \n", + " 2188-07-08 06:20:00 0 \n", + "199998 2119-02-20 10:52:00 0 \n", + " 2119-02-20 12:36:00 0 \n", + " 2119-02-20 13:33:00 0 \n", + " 2119-02-20 13:59:00 0 \n", + " 2119-02-20 20:43:00 0 \n", + "199999 2136-04-04 20:55:00 0 \n", + " 2136-04-06 15:29:00 0 \n", + "\n", + "[177450 rows x 29 columns]" + ] + }, + "execution_count": 28, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "nominal_cols = df_cleaned.columns.get_level_values('variable_type') == variable_type.NOMINAL\n", + "\n", + "for col_name in df_cleaned.loc[:,nominal_cols]:\n", + " column = df_cleaned[col_nam]\n", + " df_dummies = pd.get_dummies(column)\n", + " dummy_col_names = [col_name[:-1] + ('{}_{}'.format(col_name[-1],text),) for text in df_dummies.columns]\n", + " df_dummies.columns = pd.MultiIndex.from_tuples(dummy_col_names,names=df_cleaned.columns.names)\n", + " \n", + " df_cleaned.drop(col_name,axis=1,inplace=True)\n", + " df_cleaned = df_cleaned.join(df_dummies,how='outer')\n", + "\n", + "df_cleaned" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Possible additional cleaning:\n", + "\n", + "1. Infer UOM \n", + "2. Remove extreme values [DONE]" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import utils\n", + "import mimic\n", + "import transformers\n", + "from sklearn.pipeline import Pipeline\n", + "import icu_data_defs\n", + "import units" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "df_temp = utils.open_df('data/mimic_data','extract/temperature body')" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(mimic)\n", + "pipeline = mimic.transform_pipeline('temperature body')" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-25 00:00:00</td>\n", + " <td>98.400001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>188670.0</td>\n", + " <td>2183-08-23 20:00:00</td>\n", + " <td>99.300003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-12 08:00:00</td>\n", + " <td>98.699996948242188</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-13 17:00:00</td>\n", + " <td>99.900001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-11 20:00:00</td>\n", + " <td>37.900001525878906</td>\n", + " <td>degC</td>\n", + " <td>676</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>166707.0</td>\n", + " <td>2122-02-13 00:00:00</td>\n", + " <td>97.800003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-11 21:00:00</td>\n", + " <td>99.099998474121094</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-24 04:00:00</td>\n", + " <td>98.900001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>176176.0</td>\n", + " <td>2116-12-24 16:00:00</td>\n", + " <td>99.099998474121094</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-13 03:00:00</td>\n", + " <td>99.199996948242188</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-30 18:00:00</td>\n", + " <td>98.800003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>181750.0</td>\n", + " <td>2192-11-24 08:00:00</td>\n", + " <td>98.5</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-14 12:00:00</td>\n", + " <td>100.40000152587891</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-14 13:00:00</td>\n", + " <td>100.69999694824219</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>14</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-15 22:00:00</td>\n", + " <td>99.800003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>15</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-16 21:00:00</td>\n", + " <td>100.59999847412109</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>16</th>\n", + " <td>185910.0</td>\n", + " <td>2166-08-23 08:00:00</td>\n", + " <td>98</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>17</th>\n", + " <td>190797.0</td>\n", + " <td>2191-01-10 08:00:00</td>\n", + " <td>97.900001525878906</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>18</th>\n", + " <td>157907.0</td>\n", + " <td>2129-06-10 23:00:00</td>\n", + " <td>100.09999847412109</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " <tr>\n", + " <th>19</th>\n", + " <td>157907.0</td>\n", + " <td>2129-06-11 04:30:00</td>\n", + " <td>98.800003051757812</td>\n", + " <td>degF</td>\n", + " <td>678</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 185910.0 2166-08-25 00:00:00 98.400001525878906 degF 678\n", + "1 188670.0 2183-08-23 20:00:00 99.300003051757812 degF 678\n", + "2 185910.0 2166-08-12 08:00:00 98.699996948242188 degF 678\n", + "3 185910.0 2166-08-13 17:00:00 99.900001525878906 degF 678\n", + "4 166707.0 2122-02-11 20:00:00 37.900001525878906 degC 676\n", + "5 166707.0 2122-02-13 00:00:00 97.800003051757812 degF 678\n", + "6 185910.0 2166-08-11 21:00:00 99.099998474121094 degF 678\n", + "7 185910.0 2166-08-24 04:00:00 98.900001525878906 degF 678\n", + "8 176176.0 2116-12-24 16:00:00 99.099998474121094 degF 678\n", + "9 185910.0 2166-08-13 03:00:00 99.199996948242188 degF 678\n", + "10 185910.0 2166-08-30 18:00:00 98.800003051757812 degF 678\n", + "11 181750.0 2192-11-24 08:00:00 98.5 degF 678\n", + "12 185910.0 2166-08-14 12:00:00 100.40000152587891 degF 678\n", + "13 185910.0 2166-08-14 13:00:00 100.69999694824219 degF 678\n", + "14 185910.0 2166-08-15 22:00:00 99.800003051757812 degF 678\n", + "15 185910.0 2166-08-16 21:00:00 100.59999847412109 degF 678\n", + "16 185910.0 2166-08-23 08:00:00 98 degF 678\n", + "17 190797.0 2191-01-10 08:00:00 97.900001525878906 degF 678\n", + "18 157907.0 2129-06-10 23:00:00 100.09999847412109 degF 678\n", + "19 157907.0 2129-06-11 04:30:00 98.800003051757812 degF 678" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df_temp_tr = pipeline.transform(df_temp)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"2\" halign=\"left\">degF</th>\n", + " <th colspan=\"2\" halign=\"left\">degC</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762</th>\n", + " <th>676</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"20\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <td>98</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <td>97.9</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <td>99.5</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <td>100</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <td>99.9</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <td>97.7</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 08:00:00</th>\n", + " <td>97.8</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 12:00:00</th>\n", + " <td>97.5</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 19:00:00</th>\n", + " <td>99.8</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 00:00:00</th>\n", + " <td>99.7</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 04:00:00</th>\n", + " <td>99.3</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 08:00:00</th>\n", + " <td>99.4</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 12:00:00</th>\n", + " <td>98.8</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 16:00:00</th>\n", + " <td>99.3</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 22:00:00</th>\n", + " <td>99.9</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 00:00:00</th>\n", + " <td>99.4</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 04:00:00</th>\n", + " <td>99.6</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 08:00:00</th>\n", + " <td>99</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 13:00:00</th>\n", + " <td>98</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 19:00:00</th>\n", + " <td>99.5</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \n", + "units degF degC \n", + "description 223761 678 223762 676 \n", + "id datetime \n", + "100001 2117-09-11 13:48:00 98 None None None\n", + " 2117-09-11 16:00:00 97.9 None None None\n", + " 2117-09-11 19:00:00 99.5 None None None\n", + " 2117-09-11 22:00:00 100 None None None\n", + " 2117-09-12 01:00:00 99.9 None None None\n", + " 2117-09-12 04:00:00 97.7 None None None\n", + " 2117-09-12 08:00:00 97.8 None None None\n", + " 2117-09-12 12:00:00 97.5 None None None\n", + " 2117-09-12 19:00:00 99.8 None None None\n", + " 2117-09-13 00:00:00 99.7 None None None\n", + " 2117-09-13 04:00:00 99.3 None None None\n", + " 2117-09-13 08:00:00 99.4 None None None\n", + " 2117-09-13 12:00:00 98.8 None None None\n", + " 2117-09-13 16:00:00 99.3 None None None\n", + " 2117-09-13 22:00:00 99.9 None None None\n", + " 2117-09-14 00:00:00 99.4 None None None\n", + " 2117-09-14 04:00:00 99.6 None None None\n", + " 2117-09-14 08:00:00 99 None None None\n", + " 2117-09-14 13:00:00 98 None None None\n", + " 2117-09-14 19:00:00 99.5 None None None" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_tr.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(transformers)\n", + "reload(units)\n", + "reload(icu_data_defs)\n", + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n", + "agg_func = lambda x:x.iloc[0]\n", + "ureg = units.MedicalUreg()\n", + "standard_pipeline = Pipeline([\n", + " ('drop_small_columns',transformers.remove_small_columns(threshold=5)),\n", + " ('aggregate_same_datetime',transformers.same_index_aggregator(agg_func)),\n", + " ('split_dtype',transformers.split_dtype())\n", + " ])\n", + "\n", + "stnd_cols = transformers.column_standardizer(data_dict,ureg)\n", + "drop_oob = transformers.oob_value_remover(data_dict)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df_temp_cl = standard_pipeline.transform(df_temp_tr)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"2\" halign=\"left\">degF</th>\n", + " <th colspan=\"2\" halign=\"left\">degC</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762</th>\n", + " <th>676</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"20\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <td>97.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <td>97.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 08:00:00</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 12:00:00</th>\n", + " <td>97.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 19:00:00</th>\n", + " <td>99.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 00:00:00</th>\n", + " <td>99.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 04:00:00</th>\n", + " <td>99.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 08:00:00</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 12:00:00</th>\n", + " <td>98.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 16:00:00</th>\n", + " <td>99.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 22:00:00</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 00:00:00</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 04:00:00</th>\n", + " <td>99.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 08:00:00</th>\n", + " <td>99.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 13:00:00</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 19:00:00</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \n", + "units degF degC \n", + "description 223761 678 223762 676 \n", + "id datetime \n", + "100001 2117-09-11 13:48:00 98.0 NaN NaN NaN\n", + " 2117-09-11 16:00:00 97.9 NaN NaN NaN\n", + " 2117-09-11 19:00:00 99.5 NaN NaN NaN\n", + " 2117-09-11 22:00:00 100.0 NaN NaN NaN\n", + " 2117-09-12 01:00:00 99.9 NaN NaN NaN\n", + " 2117-09-12 04:00:00 97.7 NaN NaN NaN\n", + " 2117-09-12 08:00:00 97.8 NaN NaN NaN\n", + " 2117-09-12 12:00:00 97.5 NaN NaN NaN\n", + " 2117-09-12 19:00:00 99.8 NaN NaN NaN\n", + " 2117-09-13 00:00:00 99.7 NaN NaN NaN\n", + " 2117-09-13 04:00:00 99.3 NaN NaN NaN\n", + " 2117-09-13 08:00:00 99.4 NaN NaN NaN\n", + " 2117-09-13 12:00:00 98.8 NaN NaN NaN\n", + " 2117-09-13 16:00:00 99.3 NaN NaN NaN\n", + " 2117-09-13 22:00:00 99.9 NaN NaN NaN\n", + " 2117-09-14 00:00:00 99.4 NaN NaN NaN\n", + " 2117-09-14 04:00:00 99.6 NaN NaN NaN\n", + " 2117-09-14 08:00:00 99.0 NaN NaN NaN\n", + " 2117-09-14 13:00:00 98.0 NaN NaN NaN\n", + " 2117-09-14 19:00:00 99.5 NaN NaN NaN" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_cl.head(20)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [], + "source": [ + "df_temp_conv = stnd_cols.transform(df_temp_cl)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">degF</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762(degC)</th>\n", + " <th>676(degC)</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>522143.000000</td>\n", + " <td>768158.000000</td>\n", + " <td>74144.000000</td>\n", + " <td>370309.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>98.407970</td>\n", + " <td>98.570606</td>\n", + " <td>99.193821</td>\n", + " <td>98.765740</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>14.681127</td>\n", + " <td>2.666614</td>\n", + " <td>9.735224</td>\n", + " <td>2.608901</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>-99.900000</td>\n", + " <td>0.000000</td>\n", + " <td>26.600000</td>\n", + " <td>32.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>97.500000</td>\n", + " <td>97.599998</td>\n", + " <td>97.520000</td>\n", + " <td>97.879998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>98.300000</td>\n", + " <td>98.599998</td>\n", + " <td>98.600000</td>\n", + " <td>98.960002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>99.300000</td>\n", + " <td>99.599998</td>\n", + " <td>99.680000</td>\n", + " <td>99.860002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>9637.000000</td>\n", + " <td>109.000000</td>\n", + " <td>709.700000</td>\n", + " <td>115.700000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \n", + "status known \n", + "variable_type qn \n", + "units degF \n", + "description 223761 678 223762(degC) 676(degC)\n", + "count 522143.000000 768158.000000 74144.000000 370309.000000\n", + "mean 98.407970 98.570606 99.193821 98.765740\n", + "std 14.681127 2.666614 9.735224 2.608901\n", + "min -99.900000 0.000000 26.600000 32.000000\n", + "25% 97.500000 97.599998 97.520000 97.879998\n", + "50% 98.300000 98.599998 98.600000 98.960002\n", + "75% 99.300000 99.599998 99.680000 99.860002\n", + "max 9637.000000 109.000000 709.700000 115.700000" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_conv.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "df_temp_no_oob = drop_oob.transform(df_temp_conv)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">degF</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762(degC)</th>\n", + " <th>676(degC)</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>522116.000000</td>\n", + " <td>768158.000000</td>\n", + " <td>73638.000000</td>\n", + " <td>370309.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>98.352642</td>\n", + " <td>98.570606</td>\n", + " <td>98.430646</td>\n", + " <td>98.765740</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>2.825922</td>\n", + " <td>2.666614</td>\n", + " <td>2.467125</td>\n", + " <td>2.608901</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " <td>26.600000</td>\n", + " <td>32.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>97.500000</td>\n", + " <td>97.599998</td>\n", + " <td>97.340000</td>\n", + " <td>97.879998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>98.300000</td>\n", + " <td>98.599998</td>\n", + " <td>98.600000</td>\n", + " <td>98.960002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>99.300000</td>\n", + " <td>99.599998</td>\n", + " <td>99.680000</td>\n", + " <td>99.860002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>129.000000</td>\n", + " <td>109.000000</td>\n", + " <td>113.000000</td>\n", + " <td>115.700000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \n", + "status known \n", + "variable_type qn \n", + "units degF \n", + "description 223761 678 223762(degC) 676(degC)\n", + "count 522116.000000 768158.000000 73638.000000 370309.000000\n", + "mean 98.352642 98.570606 98.430646 98.765740\n", + "std 2.825922 2.666614 2.467125 2.608901\n", + "min 0.000000 0.000000 26.600000 32.000000\n", + "25% 97.500000 97.599998 97.340000 97.879998\n", + "50% 98.300000 98.599998 98.600000 98.960002\n", + "75% 99.300000 99.599998 99.680000 99.860002\n", + "max 129.000000 109.000000 113.000000 115.700000" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_no_oob.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "combine_like = transformers.combine_like_cols()\n", + "df_temp_combined = combine_like.transform(df_temp_no_oob)" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th>temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th>known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th>qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th>degF</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>all</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"24\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <td>97.900000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <td>99.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <td>100.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <td>99.900000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <td>97.700000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 08:00:00</th>\n", + " <td>97.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 12:00:00</th>\n", + " <td>97.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 19:00:00</th>\n", + " <td>99.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 00:00:00</th>\n", + " <td>99.700000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 04:00:00</th>\n", + " <td>99.300000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 08:00:00</th>\n", + " <td>99.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 12:00:00</th>\n", + " <td>98.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 16:00:00</th>\n", + " <td>99.300000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 22:00:00</th>\n", + " <td>99.900000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 00:00:00</th>\n", + " <td>99.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 04:00:00</th>\n", + " <td>99.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 08:00:00</th>\n", + " <td>99.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 13:00:00</th>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 19:00:00</th>\n", + " <td>99.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 00:00:00</th>\n", + " <td>99.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 08:00:00</th>\n", + " <td>98.300000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 12:00:00</th>\n", + " <td>97.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 16:00:00</th>\n", + " <td>98.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">100003</th>\n", + " <th>2150-04-17 20:31:00</th>\n", + " <td>95.900000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-17 22:00:00</th>\n", + " <td>98.200000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 00:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 04:00:00</th>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 08:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 11:18:00</th>\n", + " <td>96.300000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"7\" valign=\"top\">199998</th>\n", + " <th>2119-02-21 02:00:00</th>\n", + " <td>100.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 03:00:00</th>\n", + " <td>100.220003</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 04:00:00</th>\n", + " <td>99.860002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 05:00:00</th>\n", + " <td>100.220003</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 06:00:00</th>\n", + " <td>100.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 07:00:00</th>\n", + " <td>100.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-21 08:00:00</th>\n", + " <td>100.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"23\" valign=\"top\">199999</th>\n", + " <th>2136-04-06 16:07:00</th>\n", + " <td>97.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 20:00:00</th>\n", + " <td>97.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 00:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 02:00:00</th>\n", + " <td>101.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 05:00:00</th>\n", + " <td>100.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 08:00:00</th>\n", + " <td>99.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 12:00:00</th>\n", + " <td>99.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 15:00:00</th>\n", + " <td>100.700000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 18:00:00</th>\n", + " <td>97.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 22:00:00</th>\n", + " <td>98.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 04:00:00</th>\n", + " <td>98.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 09:00:00</th>\n", + " <td>97.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 16:00:00</th>\n", + " <td>97.700000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 20:00:00</th>\n", + " <td>99.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 00:00:00</th>\n", + " <td>99.600000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 05:00:00</th>\n", + " <td>99.100000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 08:00:00</th>\n", + " <td>97.800000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 12:00:00</th>\n", + " <td>98.300000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 16:00:00</th>\n", + " <td>98.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 20:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 00:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 03:00:00</th>\n", + " <td>97.400000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-10 08:00:00</th>\n", + " <td>98.100000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>1731503 rows × 1 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label temperature body\n", + "status known\n", + "variable_type qn\n", + "units degF\n", + "description all\n", + "id datetime \n", + "100001 2117-09-11 13:48:00 98.000000\n", + " 2117-09-11 16:00:00 97.900000\n", + " 2117-09-11 19:00:00 99.500000\n", + " 2117-09-11 22:00:00 100.000000\n", + " 2117-09-12 01:00:00 99.900000\n", + " 2117-09-12 04:00:00 97.700000\n", + " 2117-09-12 08:00:00 97.800000\n", + " 2117-09-12 12:00:00 97.500000\n", + " 2117-09-12 19:00:00 99.800000\n", + " 2117-09-13 00:00:00 99.700000\n", + " 2117-09-13 04:00:00 99.300000\n", + " 2117-09-13 08:00:00 99.400000\n", + " 2117-09-13 12:00:00 98.800000\n", + " 2117-09-13 16:00:00 99.300000\n", + " 2117-09-13 22:00:00 99.900000\n", + " 2117-09-14 00:00:00 99.400000\n", + " 2117-09-14 04:00:00 99.600000\n", + " 2117-09-14 08:00:00 99.000000\n", + " 2117-09-14 13:00:00 98.000000\n", + " 2117-09-14 19:00:00 99.500000\n", + " 2117-09-15 00:00:00 99.600000\n", + " 2117-09-15 08:00:00 98.300000\n", + " 2117-09-15 12:00:00 97.800000\n", + " 2117-09-15 16:00:00 98.600000\n", + "100003 2150-04-17 20:31:00 95.900000\n", + " 2150-04-17 22:00:00 98.200000\n", + " 2150-04-18 00:00:00 97.400000\n", + " 2150-04-18 04:00:00 98.000000\n", + " 2150-04-18 08:00:00 97.400000\n", + " 2150-04-18 11:18:00 96.300000\n", + "... ...\n", + "199998 2119-02-21 02:00:00 100.400000\n", + " 2119-02-21 03:00:00 100.220003\n", + " 2119-02-21 04:00:00 99.860002\n", + " 2119-02-21 05:00:00 100.220003\n", + " 2119-02-21 06:00:00 100.400000\n", + " 2119-02-21 07:00:00 100.400000\n", + " 2119-02-21 08:00:00 100.400000\n", + "199999 2136-04-06 16:07:00 97.800000\n", + " 2136-04-06 20:00:00 97.500000\n", + " 2136-04-07 00:00:00 97.400000\n", + " 2136-04-07 02:00:00 101.000000\n", + " 2136-04-07 05:00:00 100.500000\n", + " 2136-04-07 08:00:00 99.000000\n", + " 2136-04-07 12:00:00 99.800000\n", + " 2136-04-07 15:00:00 100.700000\n", + " 2136-04-07 18:00:00 97.600000\n", + " 2136-04-07 22:00:00 98.600000\n", + " 2136-04-08 04:00:00 98.500000\n", + " 2136-04-08 09:00:00 97.800000\n", + " 2136-04-08 16:00:00 97.700000\n", + " 2136-04-08 20:00:00 99.000000\n", + " 2136-04-09 00:00:00 99.600000\n", + " 2136-04-09 05:00:00 99.100000\n", + " 2136-04-09 08:00:00 97.800000\n", + " 2136-04-09 12:00:00 98.300000\n", + " 2136-04-09 16:00:00 98.000000\n", + " 2136-04-09 20:00:00 97.400000\n", + " 2136-04-10 00:00:00 97.400000\n", + " 2136-04-10 03:00:00 97.400000\n", + " 2136-04-10 08:00:00 98.100000\n", + "\n", + "[1731503 rows x 1 columns]" + ] + }, + "execution_count": 28, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_combined" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Segmenting" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import segmenting" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "df_context = utils.open_df('data/mimic_data','context')" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>pt_id</th>\n", + " <th>id</th>\n", + " <th>start_dt</th>\n", + " <th>end_dt</th>\n", + " <th>lang</th>\n", + " <th>religion</th>\n", + " <th>marital_status</th>\n", + " <th>ethnicity</th>\n", + " <th>dx_info</th>\n", + " <th>admission_location</th>\n", + " <th>...</th>\n", + " <th>dod</th>\n", + " <th>icd_codes</th>\n", + " <th>age</th>\n", + " <th>icustay_id</th>\n", + " <th>dbsource</th>\n", + " <th>first_icu</th>\n", + " <th>last_icu</th>\n", + " <th>intime</th>\n", + " <th>outtime</th>\n", + " <th>los</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>87</td>\n", + " <td>190659</td>\n", + " <td>2191-02-25 20:30:00</td>\n", + " <td>2191-04-25 15:18:00</td>\n", + " <td></td>\n", + " <td>UNOBTAINABLE</td>\n", + " <td></td>\n", + " <td>UNKNOWN/NOT SPECIFIED</td>\n", + " <td>NEWBORN</td>\n", + " <td>PHYS REFERRAL/NORMAL DELI</td>\n", + " <td>...</td>\n", + " <td>None</td>\n", + " <td>[V3101, 76515, 76524, 769, 7707, 7775, 7742, 7...</td>\n", + " <td>0 days 20:30:00</td>\n", + " <td>277633.0</td>\n", + " <td>carevue</td>\n", + " <td>NICU</td>\n", + " <td>NICU</td>\n", + " <td>2191-02-25 21:09:05</td>\n", + " <td>2191-04-25 15:38:56</td>\n", + " <td>58.7707</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>88</td>\n", + " <td>123010</td>\n", + " <td>2111-08-29 03:03:00</td>\n", + " <td>2111-09-03 14:24:00</td>\n", + " <td></td>\n", + " <td></td>\n", + " <td></td>\n", + " <td>BLACK/AFRICAN AMERICAN</td>\n", + " <td>S/P MOTOR VEHICLE ACCIDENT-STABBING</td>\n", + " <td>EMERGENCY ROOM ADMIT</td>\n", + " <td>...</td>\n", + " <td>None</td>\n", + " <td>[86113, 5119, 4239, E966]</td>\n", + " <td>10467 days 03:03:00</td>\n", + " <td>297289.0</td>\n", + " <td>carevue</td>\n", + " <td>TSICU</td>\n", + " <td>TSICU</td>\n", + " <td>2111-08-29 03:04:42</td>\n", + " <td>2111-08-30 21:08:09</td>\n", + " <td>1.7524</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>89</td>\n", + " <td>188646</td>\n", + " <td>2185-06-17 05:22:00</td>\n", + " <td>2185-06-21 11:15:00</td>\n", + " <td></td>\n", + " <td>UNOBTAINABLE</td>\n", + " <td></td>\n", + " <td>UNKNOWN/NOT SPECIFIED</td>\n", + " <td>NEWBORN</td>\n", + " <td>PHYS REFERRAL/NORMAL DELI</td>\n", + " <td>...</td>\n", + " <td>None</td>\n", + " <td>[V3101, 7742, 76516, 76527, 22801, V290]</td>\n", + " <td>0 days 05:22:00</td>\n", + " <td>249786.0</td>\n", + " <td>carevue</td>\n", + " <td>NICU</td>\n", + " <td>NICU</td>\n", + " <td>2185-06-17 05:46:00</td>\n", + " <td>2185-06-21 12:00:41</td>\n", + " <td>4.2602</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>91</td>\n", + " <td>121205</td>\n", + " <td>2177-04-23 00:08:00</td>\n", + " <td>2177-05-10 15:16:00</td>\n", + " <td></td>\n", + " <td>JEWISH</td>\n", + " <td>MARRIED</td>\n", + " <td>WHITE</td>\n", + " <td>FEVER</td>\n", + " <td>EMERGENCY ROOM ADMIT</td>\n", + " <td>...</td>\n", + " <td>2177-05-10 00:00:00</td>\n", + " <td>[20008, 2765, 5559, 99812, 51881, 4470, 135, 5...</td>\n", + " <td>29794 days 00:08:00</td>\n", + " <td>218528.0</td>\n", + " <td>carevue</td>\n", + " <td>CSRU</td>\n", + " <td>CSRU</td>\n", + " <td>2177-04-27 02:08:00</td>\n", + " <td>2177-04-27 14:03:00</td>\n", + " <td>0.4965</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>91</td>\n", + " <td>121205</td>\n", + " <td>2177-04-23 00:08:00</td>\n", + " <td>2177-05-10 15:16:00</td>\n", + " <td></td>\n", + " <td>JEWISH</td>\n", + " <td>MARRIED</td>\n", + " <td>WHITE</td>\n", + " <td>FEVER</td>\n", + " <td>EMERGENCY ROOM ADMIT</td>\n", + " <td>...</td>\n", + " <td>2177-05-10 00:00:00</td>\n", + " <td>[20008, 2765, 5559, 99812, 51881, 4470, 135, 5...</td>\n", + " <td>29794 days 00:08:00</td>\n", + " <td>256972.0</td>\n", + " <td>carevue</td>\n", + " <td>MICU</td>\n", + " <td>MICU</td>\n", + " <td>2177-05-07 03:52:00</td>\n", + " <td>2177-05-10 15:16:00</td>\n", + " <td>3.4750</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>5 rows × 22 columns</p>\n", + "</div>" + ], + "text/plain": [ + " pt_id id start_dt end_dt lang religion \\\n", + "0 87 190659 2191-02-25 20:30:00 2191-04-25 15:18:00 UNOBTAINABLE \n", + "1 88 123010 2111-08-29 03:03:00 2111-09-03 14:24:00 \n", + "2 89 188646 2185-06-17 05:22:00 2185-06-21 11:15:00 UNOBTAINABLE \n", + "3 91 121205 2177-04-23 00:08:00 2177-05-10 15:16:00 JEWISH \n", + "4 91 121205 2177-04-23 00:08:00 2177-05-10 15:16:00 JEWISH \n", + "\n", + " marital_status ethnicity dx_info \\\n", + "0 UNKNOWN/NOT SPECIFIED NEWBORN \n", + "1 BLACK/AFRICAN AMERICAN S/P MOTOR VEHICLE ACCIDENT-STABBING \n", + "2 UNKNOWN/NOT SPECIFIED NEWBORN \n", + "3 MARRIED WHITE FEVER \n", + "4 MARRIED WHITE FEVER \n", + "\n", + " admission_location ... dod \\\n", + "0 PHYS REFERRAL/NORMAL DELI ... None \n", + "1 EMERGENCY ROOM ADMIT ... None \n", + "2 PHYS REFERRAL/NORMAL DELI ... None \n", + "3 EMERGENCY ROOM ADMIT ... 2177-05-10 00:00:00 \n", + "4 EMERGENCY ROOM ADMIT ... 2177-05-10 00:00:00 \n", + "\n", + " icd_codes age \\\n", + "0 [V3101, 76515, 76524, 769, 7707, 7775, 7742, 7... 0 days 20:30:00 \n", + "1 [86113, 5119, 4239, E966] 10467 days 03:03:00 \n", + "2 [V3101, 7742, 76516, 76527, 22801, V290] 0 days 05:22:00 \n", + "3 [20008, 2765, 5559, 99812, 51881, 4470, 135, 5... 29794 days 00:08:00 \n", + "4 [20008, 2765, 5559, 99812, 51881, 4470, 135, 5... 29794 days 00:08:00 \n", + "\n", + " icustay_id dbsource first_icu last_icu intime \\\n", + "0 277633.0 carevue NICU NICU 2191-02-25 21:09:05 \n", + "1 297289.0 carevue TSICU TSICU 2111-08-29 03:04:42 \n", + "2 249786.0 carevue NICU NICU 2185-06-17 05:46:00 \n", + "3 218528.0 carevue CSRU CSRU 2177-04-27 02:08:00 \n", + "4 256972.0 carevue MICU MICU 2177-05-07 03:52:00 \n", + "\n", + " outtime los \n", + "0 2191-04-25 15:38:56 58.7707 \n", + "1 2111-08-30 21:08:09 1.7524 \n", + "2 2185-06-21 12:00:41 4.2602 \n", + "3 2177-04-27 14:03:00 0.4965 \n", + "4 2177-05-10 15:16:00 3.4750 \n", + "\n", + "[5 rows x 22 columns]" + ] + }, + "execution_count": 31, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_context.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "end_dt = df_temp_combined.iloc[:,0].groupby(level='id').apply(lambda x:x.sample(1))\n", + "end_dt = end_dt.reset_index(level=0,drop=True).reset_index(level=1,drop=False).iloc[:,0]" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(segmenting)\n", + "reload(utils)\n", + "all_before = segmenting.all_before(end_dt,df_context)\n", + "n_hrs_before = segmenting.n_hrs_before(end_dt,10)\n", + "periodic = segmenting.periodic(10,df_context)" + ] + }, + { + "cell_type": "code", + "execution_count": 138, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "C:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\tools\\merge.py:480: UserWarning: merging between different levels can give an unintended result (3 levels on the left, 1 on the right)\n", + " warnings.warn(msg, UserWarning)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"2\" halign=\"left\">degF</th>\n", + " <th colspan=\"2\" halign=\"left\">degC</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762</th>\n", + " <th>676</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>seg_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"8\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <th>0</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <th>0</th>\n", + " <td>97.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <th>0</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <th>0</th>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <th>0</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <th>0</th>\n", + " <td>97.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 08:00:00</th>\n", + " <th>0</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 12:00:00</th>\n", + " <th>0</th>\n", + " <td>97.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100003</th>\n", + " <th>2150-04-17 20:31:00</th>\n", + " <th>0</th>\n", + " <td>95.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-17 22:00:00</th>\n", + " <th>0</th>\n", + " <td>98.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 00:00:00</th>\n", + " <th>0</th>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"19\" valign=\"top\">100006</th>\n", + " <th>2108-04-06 16:30:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-06 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-07 00:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-07 04:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-07 08:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.099998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-07 12:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-07 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 00:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.599998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 04:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 08:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 12:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 16:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-08 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-09 00:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-09 04:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-09 08:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.099998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-09 12:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-09 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.599998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2108-04-10 00:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"10\" valign=\"top\">199998</th>\n", + " <th>2119-02-20 17:15:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.299999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 17:30:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 17:45:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.599998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 18:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.900002</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 18:30:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.200001</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 19:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.599998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.799999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 21:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.799999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 22:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.799999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2119-02-20 23:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.700001</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"20\" valign=\"top\">199999</th>\n", + " <th>2136-04-06 16:07:00</th>\n", + " <th>0</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-06 20:00:00</th>\n", + " <th>0</th>\n", + " <td>97.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 00:00:00</th>\n", + " <th>0</th>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 02:00:00</th>\n", + " <th>0</th>\n", + " <td>101.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 05:00:00</th>\n", + " <th>0</th>\n", + " <td>100.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 08:00:00</th>\n", + " <th>0</th>\n", + " <td>99.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 12:00:00</th>\n", + " <th>0</th>\n", + " <td>99.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 15:00:00</th>\n", + " <th>0</th>\n", + " <td>100.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 18:00:00</th>\n", + " <th>0</th>\n", + " <td>97.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-07 22:00:00</th>\n", + " <th>0</th>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 04:00:00</th>\n", + " <th>0</th>\n", + " <td>98.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 09:00:00</th>\n", + " <th>0</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 16:00:00</th>\n", + " <th>0</th>\n", + " <td>97.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-08 20:00:00</th>\n", + " <th>0</th>\n", + " <td>99.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 00:00:00</th>\n", + " <th>0</th>\n", + " <td>99.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 05:00:00</th>\n", + " <th>0</th>\n", + " <td>99.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 08:00:00</th>\n", + " <th>0</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 12:00:00</th>\n", + " <th>0</th>\n", + " <td>98.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 16:00:00</th>\n", + " <th>0</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2136-04-09 20:00:00</th>\n", + " <th>0</th>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>839877 rows × 4 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \\\n", + "units degF degC \n", + "description 223761 678 223762 \n", + "id datetime seg_id \n", + "100001 2117-09-11 13:48:00 0 98.0 NaN NaN \n", + " 2117-09-11 16:00:00 0 97.9 NaN NaN \n", + " 2117-09-11 19:00:00 0 99.5 NaN NaN \n", + " 2117-09-11 22:00:00 0 100.0 NaN NaN \n", + " 2117-09-12 01:00:00 0 99.9 NaN NaN \n", + " 2117-09-12 04:00:00 0 97.7 NaN NaN \n", + " 2117-09-12 08:00:00 0 97.8 NaN NaN \n", + " 2117-09-12 12:00:00 0 97.5 NaN NaN \n", + "100003 2150-04-17 20:31:00 0 95.9 NaN NaN \n", + " 2150-04-17 22:00:00 0 98.2 NaN NaN \n", + " 2150-04-18 00:00:00 0 97.4 NaN NaN \n", + "100006 2108-04-06 16:30:00 0 NaN 97.000000 NaN \n", + " 2108-04-06 20:00:00 0 NaN 97.400002 NaN \n", + " 2108-04-07 00:00:00 0 NaN 97.800003 NaN \n", + " 2108-04-07 04:00:00 0 NaN 97.000000 NaN \n", + " 2108-04-07 08:00:00 0 NaN 97.099998 NaN \n", + " 2108-04-07 12:00:00 0 NaN 97.000000 NaN \n", + " 2108-04-07 20:00:00 0 NaN 98.800003 NaN \n", + " 2108-04-08 00:00:00 0 NaN 98.599998 NaN \n", + " 2108-04-08 04:00:00 0 NaN 98.000000 NaN \n", + " 2108-04-08 08:00:00 0 NaN 97.199997 NaN \n", + " 2108-04-08 12:00:00 0 NaN 97.000000 NaN \n", + " 2108-04-08 16:00:00 0 NaN 98.000000 NaN \n", + " 2108-04-08 20:00:00 0 NaN 98.800003 NaN \n", + " 2108-04-09 00:00:00 0 NaN 97.199997 NaN \n", + " 2108-04-09 04:00:00 0 NaN 97.400002 NaN \n", + " 2108-04-09 08:00:00 0 NaN 97.099998 NaN \n", + " 2108-04-09 12:00:00 0 NaN 97.300003 NaN \n", + " 2108-04-09 20:00:00 0 NaN 97.599998 NaN \n", + " 2108-04-10 00:00:00 0 NaN 97.000000 NaN \n", + "... ... ... ... \n", + "199998 2119-02-20 17:15:00 0 NaN NaN NaN \n", + " 2119-02-20 17:30:00 0 NaN NaN NaN \n", + " 2119-02-20 17:45:00 0 NaN NaN NaN \n", + " 2119-02-20 18:00:00 0 NaN NaN NaN \n", + " 2119-02-20 18:30:00 0 NaN NaN NaN \n", + " 2119-02-20 19:00:00 0 NaN NaN NaN \n", + " 2119-02-20 20:00:00 0 NaN NaN NaN \n", + " 2119-02-20 21:00:00 0 NaN NaN NaN \n", + " 2119-02-20 22:00:00 0 NaN NaN NaN \n", + " 2119-02-20 23:00:00 0 NaN NaN NaN \n", + "199999 2136-04-06 16:07:00 0 97.8 NaN NaN \n", + " 2136-04-06 20:00:00 0 97.5 NaN NaN \n", + " 2136-04-07 00:00:00 0 97.4 NaN NaN \n", + " 2136-04-07 02:00:00 0 101.0 NaN NaN \n", + " 2136-04-07 05:00:00 0 100.5 NaN NaN \n", + " 2136-04-07 08:00:00 0 99.0 NaN NaN \n", + " 2136-04-07 12:00:00 0 99.8 NaN NaN \n", + " 2136-04-07 15:00:00 0 100.7 NaN NaN \n", + " 2136-04-07 18:00:00 0 97.6 NaN NaN \n", + " 2136-04-07 22:00:00 0 98.6 NaN NaN \n", + " 2136-04-08 04:00:00 0 98.5 NaN NaN \n", + " 2136-04-08 09:00:00 0 97.8 NaN NaN \n", + " 2136-04-08 16:00:00 0 97.7 NaN NaN \n", + " 2136-04-08 20:00:00 0 99.0 NaN NaN \n", + " 2136-04-09 00:00:00 0 99.6 NaN NaN \n", + " 2136-04-09 05:00:00 0 99.1 NaN NaN \n", + " 2136-04-09 08:00:00 0 97.8 NaN NaN \n", + " 2136-04-09 12:00:00 0 98.3 NaN NaN \n", + " 2136-04-09 16:00:00 0 98.0 NaN NaN \n", + " 2136-04-09 20:00:00 0 97.4 NaN NaN \n", + "\n", + "label \n", + "units \n", + "description 676 \n", + "id datetime seg_id \n", + "100001 2117-09-11 13:48:00 0 NaN \n", + " 2117-09-11 16:00:00 0 NaN \n", + " 2117-09-11 19:00:00 0 NaN \n", + " 2117-09-11 22:00:00 0 NaN \n", + " 2117-09-12 01:00:00 0 NaN \n", + " 2117-09-12 04:00:00 0 NaN \n", + " 2117-09-12 08:00:00 0 NaN \n", + " 2117-09-12 12:00:00 0 NaN \n", + "100003 2150-04-17 20:31:00 0 NaN \n", + " 2150-04-17 22:00:00 0 NaN \n", + " 2150-04-18 00:00:00 0 NaN \n", + "100006 2108-04-06 16:30:00 0 NaN \n", + " 2108-04-06 20:00:00 0 NaN \n", + " 2108-04-07 00:00:00 0 NaN \n", + " 2108-04-07 04:00:00 0 NaN \n", + " 2108-04-07 08:00:00 0 NaN \n", + " 2108-04-07 12:00:00 0 NaN \n", + " 2108-04-07 20:00:00 0 NaN \n", + " 2108-04-08 00:00:00 0 NaN \n", + " 2108-04-08 04:00:00 0 NaN \n", + " 2108-04-08 08:00:00 0 NaN \n", + " 2108-04-08 12:00:00 0 NaN \n", + " 2108-04-08 16:00:00 0 NaN \n", + " 2108-04-08 20:00:00 0 NaN \n", + " 2108-04-09 00:00:00 0 NaN \n", + " 2108-04-09 04:00:00 0 NaN \n", + " 2108-04-09 08:00:00 0 NaN \n", + " 2108-04-09 12:00:00 0 NaN \n", + " 2108-04-09 20:00:00 0 NaN \n", + " 2108-04-10 00:00:00 0 NaN \n", + "... ... \n", + "199998 2119-02-20 17:15:00 0 36.299999 \n", + " 2119-02-20 17:30:00 0 36.500000 \n", + " 2119-02-20 17:45:00 0 36.599998 \n", + " 2119-02-20 18:00:00 0 36.900002 \n", + " 2119-02-20 18:30:00 0 37.200001 \n", + " 2119-02-20 19:00:00 0 37.599998 \n", + " 2119-02-20 20:00:00 0 37.799999 \n", + " 2119-02-20 21:00:00 0 37.799999 \n", + " 2119-02-20 22:00:00 0 37.799999 \n", + " 2119-02-20 23:00:00 0 37.700001 \n", + "199999 2136-04-06 16:07:00 0 NaN \n", + " 2136-04-06 20:00:00 0 NaN \n", + " 2136-04-07 00:00:00 0 NaN \n", + " 2136-04-07 02:00:00 0 NaN \n", + " 2136-04-07 05:00:00 0 NaN \n", + " 2136-04-07 08:00:00 0 NaN \n", + " 2136-04-07 12:00:00 0 NaN \n", + " 2136-04-07 15:00:00 0 NaN \n", + " 2136-04-07 18:00:00 0 NaN \n", + " 2136-04-07 22:00:00 0 NaN \n", + " 2136-04-08 04:00:00 0 NaN \n", + " 2136-04-08 09:00:00 0 NaN \n", + " 2136-04-08 16:00:00 0 NaN \n", + " 2136-04-08 20:00:00 0 NaN \n", + " 2136-04-09 00:00:00 0 NaN \n", + " 2136-04-09 05:00:00 0 NaN \n", + " 2136-04-09 08:00:00 0 NaN \n", + " 2136-04-09 12:00:00 0 NaN \n", + " 2136-04-09 16:00:00 0 NaN \n", + " 2136-04-09 20:00:00 0 NaN \n", + "\n", + "[839877 rows x 4 columns]" + ] + }, + "execution_count": 138, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_all_before = all_before.transform(df_temp_cl)\n", + "df_temp_all_before[df_temp_all_before.index.get_level_values('seg_id') > -1]" + ] + }, + { + "cell_type": "code", + "execution_count": 262, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " seg_id\n", + "id datetime \n", + "100001 2117-09-11 22:00:00 0\n", + " 2117-09-12 01:00:00 0\n", + " 2117-09-12 04:00:00 0\n", + "100006 2108-04-07 20:00:00 0\n", + "100007 2145-04-04 00:00:00 0\n", + " 2145-04-04 04:00:00 0\n", + "100009 2162-05-19 03:00:00 0\n", + "100010 2109-12-10 22:47:00 0\n", + " 2109-12-11 00:00:00 0\n", + "100011 2177-09-07 09:00:00 0\n", + " 2177-09-07 13:00:00 0\n", + " 2177-09-07 17:00:00 0\n", + "label temperature body \n", + "status known \n", + "variable_type qn \n", + "units degF \n", + "description 223761 678 223762(degC) 676(degC)\n", + "id datetime seg_id \n", + "100001 2117-09-11 13:48:00 -1 98.0 NaN NaN NaN\n", + " 2117-09-11 16:00:00 -1 97.9 NaN NaN NaN\n", + " 2117-09-11 19:00:00 -1 99.5 NaN NaN NaN\n", + " 2117-09-11 22:00:00 0 100.0 NaN NaN NaN\n", + " 2117-09-12 01:00:00 0 99.9 NaN NaN NaN\n", + " 2117-09-12 04:00:00 0 97.7 NaN NaN NaN\n", + " 2117-09-12 08:00:00 -1 97.8 NaN NaN NaN\n", + " 2117-09-12 12:00:00 -1 97.5 NaN NaN NaN\n", + " 2117-09-12 19:00:00 -1 99.8 NaN NaN NaN\n", + " 2117-09-13 00:00:00 -1 99.7 NaN NaN NaN\n", + " 2117-09-13 04:00:00 -1 99.3 NaN NaN NaN\n", + " 2117-09-13 08:00:00 -1 99.4 NaN NaN NaN\n", + " 2117-09-13 12:00:00 -1 98.8 NaN NaN NaN\n", + " 2117-09-13 16:00:00 -1 99.3 NaN NaN NaN\n", + " 2117-09-13 22:00:00 -1 99.9 NaN NaN NaN\n", + " 2117-09-14 00:00:00 -1 99.4 NaN NaN NaN\n", + " 2117-09-14 04:00:00 -1 99.6 NaN NaN NaN\n", + " 2117-09-14 08:00:00 -1 99.0 NaN NaN NaN\n", + " 2117-09-14 13:00:00 -1 98.0 NaN NaN NaN\n", + " 2117-09-14 19:00:00 -1 99.5 NaN NaN NaN\n", + " 2117-09-15 00:00:00 -1 99.6 NaN NaN NaN\n", + " 2117-09-15 08:00:00 -1 98.3 NaN NaN NaN\n", + " 2117-09-15 12:00:00 -1 97.8 NaN NaN NaN\n", + " 2117-09-15 16:00:00 -1 98.6 NaN NaN NaN\n", + "100003 2150-04-17 20:31:00 -1 95.9 NaN NaN NaN\n", + " 2150-04-17 22:00:00 -1 98.2 NaN NaN NaN\n", + " 2150-04-18 00:00:00 -1 97.4 NaN NaN NaN\n", + " 2150-04-18 04:00:00 -1 98.0 NaN NaN NaN\n", + " 2150-04-18 08:00:00 -1 97.4 NaN NaN NaN\n", + " 2150-04-18 11:18:00 -1 96.3 NaN NaN NaN\n", + "... ... .. ... ...\n", + "100011 2177-09-04 19:00:00 -1 101.0 NaN NaN NaN\n", + " 2177-09-04 20:00:00 -1 101.2 NaN NaN NaN\n", + " 2177-09-04 22:00:00 -1 102.1 NaN NaN NaN\n", + " 2177-09-05 00:00:00 -1 101.8 NaN NaN NaN\n", + " 2177-09-05 02:00:00 -1 100.8 NaN NaN NaN\n", + " 2177-09-05 04:00:00 -1 100.1 NaN NaN NaN\n", + " 2177-09-05 06:00:00 -1 100.1 NaN NaN NaN\n", + " 2177-09-05 08:00:00 -1 99.5 NaN NaN NaN\n", + " 2177-09-05 10:00:00 -1 101.4 NaN NaN NaN\n", + " 2177-09-05 12:00:00 -1 101.1 NaN NaN NaN\n", + " 2177-09-05 14:00:00 -1 99.8 NaN NaN NaN\n", + " 2177-09-05 16:00:00 -1 97.5 NaN NaN NaN\n", + " 2177-09-05 20:00:00 -1 102.0 NaN NaN NaN\n", + " 2177-09-05 23:00:00 -1 100.8 NaN NaN NaN\n", + " 2177-09-06 02:00:00 -1 101.0 NaN NaN NaN\n", + " 2177-09-06 04:00:00 -1 101.2 NaN NaN NaN\n", + " 2177-09-06 08:00:00 -1 100.1 NaN NaN NaN\n", + " 2177-09-06 12:00:00 -1 100.1 NaN NaN NaN\n", + " 2177-09-06 16:00:00 -1 102.7 NaN NaN NaN\n", + " 2177-09-06 18:00:00 -1 102.0 NaN NaN NaN\n", + " 2177-09-06 20:00:00 -1 101.3 NaN NaN NaN\n", + " 2177-09-06 23:00:00 -1 101.9 NaN NaN NaN\n", + " 2177-09-07 00:00:00 -1 99.9 NaN NaN NaN\n", + " 2177-09-07 04:00:00 -1 100.5 NaN NaN NaN\n", + " 2177-09-07 09:00:00 0 99.5 NaN NaN NaN\n", + " 2177-09-07 13:00:00 0 99.1 NaN NaN NaN\n", + " 2177-09-07 17:00:00 0 99.2 NaN NaN NaN\n", + " 2177-09-07 19:00:00 -1 99.9 NaN NaN NaN\n", + " 2177-09-08 00:00:00 -1 99.8 NaN NaN NaN\n", + " 2177-09-08 04:00:00 -1 99.5 NaN NaN NaN\n", + "\n", + "[200 rows x 4 columns]\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">degF</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762(degC)</th>\n", + " <th>676(degC)</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>seg_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <th>0</th>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <th>0</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <th>0</th>\n", + " <td>97.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100006</th>\n", + " <th>2108-04-07 20:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100007</th>\n", + " <th>2145-04-04 00:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>98.699997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2145-04-04 04:00:00</th>\n", + " <th>0</th>\n", + " <td>NaN</td>\n", + " <td>97.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100009</th>\n", + " <th>2162-05-19 03:00:00</th>\n", + " <th>0</th>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100010</th>\n", + " <th>2109-12-10 22:47:00</th>\n", + " <th>0</th>\n", + " <td>100.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2109-12-11 00:00:00</th>\n", + " <th>0</th>\n", + " <td>98.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100011</th>\n", + " <th>2177-09-07 09:00:00</th>\n", + " <th>0</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-09-07 13:00:00</th>\n", + " <th>0</th>\n", + " <td>99.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2177-09-07 17:00:00</th>\n", + " <th>0</th>\n", + " <td>99.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \\\n", + "status known \n", + "variable_type qn \n", + "units degF \n", + "description 223761 678 223762(degC) \n", + "id datetime seg_id \n", + "100001 2117-09-11 22:00:00 0 100.0 NaN NaN \n", + " 2117-09-12 01:00:00 0 99.9 NaN NaN \n", + " 2117-09-12 04:00:00 0 97.7 NaN NaN \n", + "100006 2108-04-07 20:00:00 0 NaN 98.800003 NaN \n", + "100007 2145-04-04 00:00:00 0 NaN 98.699997 NaN \n", + " 2145-04-04 04:00:00 0 NaN 97.400002 NaN \n", + "100009 2162-05-19 03:00:00 0 98.6 NaN NaN \n", + "100010 2109-12-10 22:47:00 0 100.2 NaN NaN \n", + " 2109-12-11 00:00:00 0 98.8 NaN NaN \n", + "100011 2177-09-07 09:00:00 0 99.5 NaN NaN \n", + " 2177-09-07 13:00:00 0 99.1 NaN NaN \n", + " 2177-09-07 17:00:00 0 99.2 NaN NaN \n", + "\n", + "label \n", + "status \n", + "variable_type \n", + "units \n", + "description 676(degC) \n", + "id datetime seg_id \n", + "100001 2117-09-11 22:00:00 0 NaN \n", + " 2117-09-12 01:00:00 0 NaN \n", + " 2117-09-12 04:00:00 0 NaN \n", + "100006 2108-04-07 20:00:00 0 NaN \n", + "100007 2145-04-04 00:00:00 0 NaN \n", + " 2145-04-04 04:00:00 0 NaN \n", + "100009 2162-05-19 03:00:00 0 NaN \n", + "100010 2109-12-10 22:47:00 0 NaN \n", + " 2109-12-11 00:00:00 0 NaN \n", + "100011 2177-09-07 09:00:00 0 NaN \n", + " 2177-09-07 13:00:00 0 NaN \n", + " 2177-09-07 17:00:00 0 NaN " + ] + }, + "execution_count": 262, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_Nhr_before = n_hrs_before.transform(df_temp_combined.head(200))\n", + "df_temp_Nhr_before[df_temp_Nhr_before.index.get_level_values('seg_id') > -1]" + ] + }, + { + "cell_type": "code", + "execution_count": 266, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>label</th>\n", + " <th colspan=\"4\" halign=\"left\">temperature body</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"4\" halign=\"left\">known</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"4\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"4\" halign=\"left\">degF</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>223761</th>\n", + " <th>678</th>\n", + " <th>223762(degC)</th>\n", + " <th>676(degC)</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>seg_id</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"24\" valign=\"top\">100001</th>\n", + " <th>2117-09-11 13:48:00</th>\n", + " <th>0</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 16:00:00</th>\n", + " <th>0</th>\n", + " <td>97.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 19:00:00</th>\n", + " <th>0</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-11 22:00:00</th>\n", + " <th>1</th>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 01:00:00</th>\n", + " <th>1</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 04:00:00</th>\n", + " <th>1</th>\n", + " <td>97.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 08:00:00</th>\n", + " <th>2</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 12:00:00</th>\n", + " <th>2</th>\n", + " <td>97.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-12 19:00:00</th>\n", + " <th>3</th>\n", + " <td>99.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 00:00:00</th>\n", + " <th>3</th>\n", + " <td>99.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 04:00:00</th>\n", + " <th>4</th>\n", + " <td>99.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 08:00:00</th>\n", + " <th>4</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 12:00:00</th>\n", + " <th>4</th>\n", + " <td>98.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 16:00:00</th>\n", + " <th>5</th>\n", + " <td>99.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-13 22:00:00</th>\n", + " <th>5</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 00:00:00</th>\n", + " <th>6</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 04:00:00</th>\n", + " <th>6</th>\n", + " <td>99.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 08:00:00</th>\n", + " <th>6</th>\n", + " <td>99.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 13:00:00</th>\n", + " <th>7</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-14 19:00:00</th>\n", + " <th>7</th>\n", + " <td>99.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 00:00:00</th>\n", + " <th>8</th>\n", + " <td>99.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 08:00:00</th>\n", + " <th>9</th>\n", + " <td>98.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 12:00:00</th>\n", + " <th>9</th>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2117-09-15 16:00:00</th>\n", + " <th>10</th>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"6\" valign=\"top\">100003</th>\n", + " <th>2150-04-17 20:31:00</th>\n", + " <th>0</th>\n", + " <td>95.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-17 22:00:00</th>\n", + " <th>0</th>\n", + " <td>98.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 00:00:00</th>\n", + " <th>0</th>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 04:00:00</th>\n", + " <th>1</th>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 08:00:00</th>\n", + " <th>1</th>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2150-04-18 11:18:00</th>\n", + " <th>1</th>\n", + " <td>96.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"16\" valign=\"top\">100114</th>\n", + " <th>2157-09-19 18:15:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-19 18:30:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-19 20:00:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-19 23:00:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 00:00:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.599998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 01:00:00</th>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 01:15:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>98.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 02:00:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>97.099998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 06:00:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>98.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 08:00:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>96.699997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 09:15:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>96.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 09:30:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 10:00:00</th>\n", + " <th>4</th>\n", + " <td>NaN</td>\n", + " <td>96.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 12:00:00</th>\n", + " <th>5</th>\n", + " <td>NaN</td>\n", + " <td>97.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 15:00:00</th>\n", + " <th>5</th>\n", + " <td>NaN</td>\n", + " <td>98.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2157-09-20 18:00:00</th>\n", + " <th>5</th>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"13\" valign=\"top\">100116</th>\n", + " <th>2173-07-27 05:13:00</th>\n", + " <th>0</th>\n", + " <td>98.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 08:00:00</th>\n", + " <th>0</th>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 09:30:00</th>\n", + " <th>0</th>\n", + " <td>99.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 11:00:00</th>\n", + " <th>0</th>\n", + " <td>98.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 14:25:00</th>\n", + " <th>0</th>\n", + " <td>100.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 16:30:00</th>\n", + " <th>1</th>\n", + " <td>100.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 18:00:00</th>\n", + " <th>1</th>\n", + " <td>99.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-27 20:00:00</th>\n", + " <th>1</th>\n", + " <td>100.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-28 00:00:00</th>\n", + " <th>1</th>\n", + " <td>99.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-28 04:00:00</th>\n", + " <th>2</th>\n", + " <td>98.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-28 08:00:00</th>\n", + " <th>2</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-28 12:00:00</th>\n", + " <th>3</th>\n", + " <td>98.5</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2173-07-28 16:00:00</th>\n", + " <th>3</th>\n", + " <td>99.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>100117</th>\n", + " <th>2166-04-30 21:39:00</th>\n", + " <th>0</th>\n", + " <td>99.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>2000 rows × 4 columns</p>\n", + "</div>" + ], + "text/plain": [ + "label temperature body \\\n", + "status known \n", + "variable_type qn \n", + "units degF \n", + "description 223761 678 223762(degC) \n", + "id datetime seg_id \n", + "100001 2117-09-11 13:48:00 0 98.0 NaN NaN \n", + " 2117-09-11 16:00:00 0 97.9 NaN NaN \n", + " 2117-09-11 19:00:00 0 99.5 NaN NaN \n", + " 2117-09-11 22:00:00 1 100.0 NaN NaN \n", + " 2117-09-12 01:00:00 1 99.9 NaN NaN \n", + " 2117-09-12 04:00:00 1 97.7 NaN NaN \n", + " 2117-09-12 08:00:00 2 97.8 NaN NaN \n", + " 2117-09-12 12:00:00 2 97.5 NaN NaN \n", + " 2117-09-12 19:00:00 3 99.8 NaN NaN \n", + " 2117-09-13 00:00:00 3 99.7 NaN NaN \n", + " 2117-09-13 04:00:00 4 99.3 NaN NaN \n", + " 2117-09-13 08:00:00 4 99.4 NaN NaN \n", + " 2117-09-13 12:00:00 4 98.8 NaN NaN \n", + " 2117-09-13 16:00:00 5 99.3 NaN NaN \n", + " 2117-09-13 22:00:00 5 99.9 NaN NaN \n", + " 2117-09-14 00:00:00 6 99.4 NaN NaN \n", + " 2117-09-14 04:00:00 6 99.6 NaN NaN \n", + " 2117-09-14 08:00:00 6 99.0 NaN NaN \n", + " 2117-09-14 13:00:00 7 98.0 NaN NaN \n", + " 2117-09-14 19:00:00 7 99.5 NaN NaN \n", + " 2117-09-15 00:00:00 8 99.6 NaN NaN \n", + " 2117-09-15 08:00:00 9 98.3 NaN NaN \n", + " 2117-09-15 12:00:00 9 97.8 NaN NaN \n", + " 2117-09-15 16:00:00 10 98.6 NaN NaN \n", + "100003 2150-04-17 20:31:00 0 95.9 NaN NaN \n", + " 2150-04-17 22:00:00 0 98.2 NaN NaN \n", + " 2150-04-18 00:00:00 0 97.4 NaN NaN \n", + " 2150-04-18 04:00:00 1 98.0 NaN NaN \n", + " 2150-04-18 08:00:00 1 97.4 NaN NaN \n", + " 2150-04-18 11:18:00 1 96.3 NaN NaN \n", + "... ... ... ... \n", + "100114 2157-09-19 18:15:00 3 NaN 98.400002 NaN \n", + " 2157-09-19 18:30:00 3 NaN 98.300003 NaN \n", + " 2157-09-19 20:00:00 3 NaN 98.400002 NaN \n", + " 2157-09-19 23:00:00 3 NaN 98.400002 NaN \n", + " 2157-09-20 00:00:00 3 NaN 98.599998 NaN \n", + " 2157-09-20 01:00:00 3 NaN 98.000000 NaN \n", + " 2157-09-20 01:15:00 4 NaN 98.199997 NaN \n", + " 2157-09-20 02:00:00 4 NaN 97.099998 NaN \n", + " 2157-09-20 06:00:00 4 NaN 98.000000 NaN \n", + " 2157-09-20 08:00:00 4 NaN 96.699997 NaN \n", + " 2157-09-20 09:15:00 4 NaN 96.900002 NaN \n", + " 2157-09-20 09:30:00 4 NaN 97.000000 NaN \n", + " 2157-09-20 10:00:00 4 NaN 96.900002 NaN \n", + " 2157-09-20 12:00:00 5 NaN 97.199997 NaN \n", + " 2157-09-20 15:00:00 5 NaN 98.400002 NaN \n", + " 2157-09-20 18:00:00 5 NaN 97.800003 NaN \n", + "100116 2173-07-27 05:13:00 0 98.9 NaN NaN \n", + " 2173-07-27 08:00:00 0 100.0 NaN NaN \n", + " 2173-07-27 09:30:00 0 99.7 NaN NaN \n", + " 2173-07-27 11:00:00 0 98.7 NaN NaN \n", + " 2173-07-27 14:25:00 0 100.4 NaN NaN \n", + " 2173-07-27 16:30:00 1 100.3 NaN NaN \n", + " 2173-07-27 18:00:00 1 99.9 NaN NaN \n", + " 2173-07-27 20:00:00 1 100.3 NaN NaN \n", + " 2173-07-28 00:00:00 1 99.7 NaN NaN \n", + " 2173-07-28 04:00:00 2 98.5 NaN NaN \n", + " 2173-07-28 08:00:00 2 99.4 NaN NaN \n", + " 2173-07-28 12:00:00 3 98.5 NaN NaN \n", + " 2173-07-28 16:00:00 3 99.4 NaN NaN \n", + "100117 2166-04-30 21:39:00 0 99.7 NaN NaN \n", + "\n", + "label \n", + "status \n", + "variable_type \n", + "units \n", + "description 676(degC) \n", + "id datetime seg_id \n", + "100001 2117-09-11 13:48:00 0 NaN \n", + " 2117-09-11 16:00:00 0 NaN \n", + " 2117-09-11 19:00:00 0 NaN \n", + " 2117-09-11 22:00:00 1 NaN \n", + " 2117-09-12 01:00:00 1 NaN \n", + " 2117-09-12 04:00:00 1 NaN \n", + " 2117-09-12 08:00:00 2 NaN \n", + " 2117-09-12 12:00:00 2 NaN \n", + " 2117-09-12 19:00:00 3 NaN \n", + " 2117-09-13 00:00:00 3 NaN \n", + " 2117-09-13 04:00:00 4 NaN \n", + " 2117-09-13 08:00:00 4 NaN \n", + " 2117-09-13 12:00:00 4 NaN \n", + " 2117-09-13 16:00:00 5 NaN \n", + " 2117-09-13 22:00:00 5 NaN \n", + " 2117-09-14 00:00:00 6 NaN \n", + " 2117-09-14 04:00:00 6 NaN \n", + " 2117-09-14 08:00:00 6 NaN \n", + " 2117-09-14 13:00:00 7 NaN \n", + " 2117-09-14 19:00:00 7 NaN \n", + " 2117-09-15 00:00:00 8 NaN \n", + " 2117-09-15 08:00:00 9 NaN \n", + " 2117-09-15 12:00:00 9 NaN \n", + " 2117-09-15 16:00:00 10 NaN \n", + "100003 2150-04-17 20:31:00 0 NaN \n", + " 2150-04-17 22:00:00 0 NaN \n", + " 2150-04-18 00:00:00 0 NaN \n", + " 2150-04-18 04:00:00 1 NaN \n", + " 2150-04-18 08:00:00 1 NaN \n", + " 2150-04-18 11:18:00 1 NaN \n", + "... ... \n", + "100114 2157-09-19 18:15:00 3 NaN \n", + " 2157-09-19 18:30:00 3 NaN \n", + " 2157-09-19 20:00:00 3 NaN \n", + " 2157-09-19 23:00:00 3 NaN \n", + " 2157-09-20 00:00:00 3 NaN \n", + " 2157-09-20 01:00:00 3 NaN \n", + " 2157-09-20 01:15:00 4 NaN \n", + " 2157-09-20 02:00:00 4 NaN \n", + " 2157-09-20 06:00:00 4 NaN \n", + " 2157-09-20 08:00:00 4 NaN \n", + " 2157-09-20 09:15:00 4 NaN \n", + " 2157-09-20 09:30:00 4 NaN \n", + " 2157-09-20 10:00:00 4 NaN \n", + " 2157-09-20 12:00:00 5 NaN \n", + " 2157-09-20 15:00:00 5 NaN \n", + " 2157-09-20 18:00:00 5 NaN \n", + "100116 2173-07-27 05:13:00 0 NaN \n", + " 2173-07-27 08:00:00 0 NaN \n", + " 2173-07-27 09:30:00 0 NaN \n", + " 2173-07-27 11:00:00 0 NaN \n", + " 2173-07-27 14:25:00 0 NaN \n", + " 2173-07-27 16:30:00 1 NaN \n", + " 2173-07-27 18:00:00 1 NaN \n", + " 2173-07-27 20:00:00 1 NaN \n", + " 2173-07-28 00:00:00 1 NaN \n", + " 2173-07-28 04:00:00 2 NaN \n", + " 2173-07-28 08:00:00 2 NaN \n", + " 2173-07-28 12:00:00 3 NaN \n", + " 2173-07-28 16:00:00 3 NaN \n", + "100117 2166-04-30 21:39:00 0 NaN \n", + "\n", + "[2000 rows x 4 columns]" + ] + }, + "execution_count": 266, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_temp_periodic = periodic.transform(df_temp_combined.head(2000))\n", + "df_temp_periodic[df_temp_periodic.index.get_level_values('seg_id') > -1]" + ] + }, + { + "cell_type": "code", + "execution_count": 252, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import utils\n", + "import mimic\n", + "import transformers\n", + "from sklearn.pipeline import Pipeline\n", + "import icu_data_defs\n", + "import units\n", + "import segmenting\n", + "from sklearn_pandas import DataFrameMapper\n", + "import constants\n", + "import features" + ] + }, + { + "cell_type": "code", + "execution_count": 251, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "hdf5_fname = 'data/mimic_data'\n", + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "df_cleaned" + ] + }, + { + "cell_type": "code", + "execution_count": 249, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "end_dt = df_temp_combined.iloc[:,0].groupby(level='id').apply(lambda x:x.sample(1))\n", + "end_dt = end_dt.reset_index(level=0,drop=True).reset_index(level=1,drop=False).iloc[:,0]\n", + "all_before = segmenting.all_before(end_dt,df_context)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Feature creation" + ] + }, + { + "cell_type": "code", + "execution_count": 247, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import utils\n", + "import transformers\n", + "from sklearn.pipeline import Pipeline\n", + "import units\n", + "from sklearn_pandas import DataFrameMapper\n", + "import constants\n", + "import features" + ] + }, + { + "cell_type": "code", + "execution_count": 248, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "ename": "ImportError", + "evalue": "cannot import name CUSTOM_FILTER", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mImportError\u001b[0m Traceback (most recent call last)", + "\u001b[1;32m<ipython-input-248-bae7a29e5c29>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mfeatures\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 2\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mutils\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0munits\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mconstants\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 5\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\features.pyc\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m 1\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mbase\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mTransformerMixin\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mBaseEstimator\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 2\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mpipeline\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mFeatureUnion\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 3\u001b[1;33m \u001b[1;32mfrom\u001b[0m \u001b[0mconstants\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mcolumn_names\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mSEG_ID\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mNO_SEGMENT\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mCUSTOM_FILTER\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 4\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mnumpy\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 5\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn_pandas\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mDataFrameMapper\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;31mImportError\u001b[0m: cannot import name CUSTOM_FILTER" + ] + } + ], + "source": [ + "reload(features)\n", + "reload(utils)\n", + "reload(units)\n", + "reload(constants)\n", + "\n", + "df = df_temp_all_before\n", + "ureg = units.MedicalUreg()\n", + "\n", + "\n", + "\n", + "def summable_filter(df):\n", + " filter_func= lambda x: (ureg.is_volume(str(x[-2])) or ureg.is_mass(str(x[-2]))) and (x[0] != 'weight body')\n", + " return df.loc[:,df.columns.map(filter_func)]\n", + "\n", + "feature_tuples = [\n", + " ('MEAN',features.segment_mean(),ALL),\n", + " ('STD',features.segment_std(),ALL),\n", + " ('COUNT',features.segment_count(),ALL),\n", + " ('LAST',features.segment_last(),ALL),\n", + " ('SUM',features.segment_sum(),{constants.CUSTOM_FILTER:summable_filter})\n", + "]\n", + "\n", + "mapped_ft = features.make_mapper(feature_tuples,df)" + ] + }, + { + "cell_type": "code", + "execution_count": 232, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "feature_df = mapped_ft.transform(df)" + ] + }, + { + "cell_type": "code", + "execution_count": 233, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>temperature body_degF_223761_MEAN</th>\n", + " <th>temperature body_degF_678_MEAN</th>\n", + " <th>temperature body_degC_223762_MEAN</th>\n", + " <th>temperature body_degC_676_MEAN</th>\n", + " <th>temperature body_degF_223761_STD</th>\n", + " <th>temperature body_degF_678_STD</th>\n", + " <th>temperature body_degC_223762_STD</th>\n", + " <th>temperature body_degC_676_STD</th>\n", + " <th>temperature body_degF_223761_COUNT</th>\n", + " <th>temperature body_degF_678_COUNT</th>\n", + " <th>temperature body_degC_223762_COUNT</th>\n", + " <th>temperature body_degC_676_COUNT</th>\n", + " <th>temperature body_degF_223761_LAST</th>\n", + " <th>temperature body_degF_678_LAST</th>\n", + " <th>temperature body_degC_223762_LAST</th>\n", + " <th>temperature body_degC_676_LAST</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>98.537500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.064945</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>8.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>97.166667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.167619</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>95.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>NaN</td>\n", + " <td>97.533334</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.607729</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>21.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.591667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.466263</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>12.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>95.699997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>98.100000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.458258</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>3.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>98.550000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.036822</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>6.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>100.2</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>98.380000</td>\n", + " <td>NaN</td>\n", + " <td>36.511765</td>\n", + " <td>NaN</td>\n", + " <td>0.641872</td>\n", + " <td>NaN</td>\n", + " <td>0.790767</td>\n", + " <td>NaN</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>34.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34.5</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>NaN</td>\n", + " <td>100.649998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.777816</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>2.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>101.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>97.975000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.875032</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>12.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>97.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>96.050000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.777817</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>96.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>NaN</td>\n", + " <td>98.536364</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.492489</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>11.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.378571</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.260705</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>14.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.6</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>99.466667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.495650</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>12.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>NaN</td>\n", + " <td>99.099998</td>\n", + " <td>NaN</td>\n", + " <td>36.766037</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.374646</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>106.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.599998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>14</th>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>15</th>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.141421</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>16</th>\n", + " <td>100.772222</td>\n", + " <td>NaN</td>\n", + " <td>37.719512</td>\n", + " <td>NaN</td>\n", + " <td>1.075287</td>\n", + " <td>NaN</td>\n", + " <td>0.281265</td>\n", + " <td>NaN</td>\n", + " <td>18.0</td>\n", + " <td>0.0</td>\n", + " <td>41.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.5</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>17</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.193750</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.401560</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>32.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.799999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>18</th>\n", + " <td>99.345455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.864975</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>33.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>19</th>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>20</th>\n", + " <td>98.312500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.022986</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>16.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>97.6</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>21</th>\n", + " <td>97.760000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.585662</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>22</th>\n", + " <td>NaN</td>\n", + " <td>98.445455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.849254</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>22.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>23</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34.990909</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>4.190574</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>11.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>28.4</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>24</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.799999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.799999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25</th>\n", + " <td>NaN</td>\n", + " <td>97.320000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.277491</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>26</th>\n", + " <td>NaN</td>\n", + " <td>96.700000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.754119</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>24.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>27</th>\n", + " <td>NaN</td>\n", + " <td>96.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.787487</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>10.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>94.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>28</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.847368</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.300681</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>19.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.200001</td>\n", + " </tr>\n", + " <tr>\n", + " <th>29</th>\n", + " <td>96.525000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>4.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>96.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44216</th>\n", + " <td>NaN</td>\n", + " <td>98.302703</td>\n", + " <td>NaN</td>\n", + " <td>37.021739</td>\n", + " <td>NaN</td>\n", + " <td>1.047082</td>\n", + " <td>NaN</td>\n", + " <td>0.997311</td>\n", + " <td>0.0</td>\n", + " <td>37.0</td>\n", + " <td>0.0</td>\n", + " <td>46.0</td>\n", + " <td>NaN</td>\n", + " <td>96.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44217</th>\n", + " <td>98.475000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.081280</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>4.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>97.1</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44218</th>\n", + " <td>96.275000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.420034</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>8.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>96.3</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44219</th>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44220</th>\n", + " <td>NaN</td>\n", + " <td>95.740001</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.021275</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>94.099998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44221</th>\n", + " <td>NaN</td>\n", + " <td>97.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.672309</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.099998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44222</th>\n", + " <td>99.240000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.512835</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>5.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>99.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44223</th>\n", + " <td>98.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.070711</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>2.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44224</th>\n", + " <td>NaN</td>\n", + " <td>98.130000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.531351</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>10.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44225</th>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.199997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>4.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44226</th>\n", + " <td>99.753333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.765195</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>15.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.7</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44227</th>\n", + " <td>NaN</td>\n", + " <td>98.071875</td>\n", + " <td>NaN</td>\n", + " <td>37.449181</td>\n", + " <td>NaN</td>\n", + " <td>0.944674</td>\n", + " <td>NaN</td>\n", + " <td>0.920982</td>\n", + " <td>0.0</td>\n", + " <td>32.0</td>\n", + " <td>0.0</td>\n", + " <td>61.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44228</th>\n", + " <td>NaN</td>\n", + " <td>100.526316</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.175605</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>19.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>98.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44229</th>\n", + " <td>97.580000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.740570</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>10.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>96.9</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44230</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.443518</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.332443</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>108.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>37.299999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44231</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.071429</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.239964</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>14.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>35.599998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44232</th>\n", + " <td>98.484375</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.070456</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>32.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>100.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44233</th>\n", + " <td>NaN</td>\n", + " <td>100.278462</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.300803</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>130.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44234</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.173333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.688131</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>15.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>35.0</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44235</th>\n", + " <td>NaN</td>\n", + " <td>97.074999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.056330</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>4.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>95.599998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44236</th>\n", + " <td>97.977778</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.032930</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>9.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>98.4</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44237</th>\n", + " <td>NaN</td>\n", + " <td>97.485713</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.977118</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>7.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>95.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44238</th>\n", + " <td>NaN</td>\n", + " <td>97.264285</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.759157</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>14.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>96.599998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44239</th>\n", + " <td>NaN</td>\n", + " <td>95.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.565688</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>2.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>95.000000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44240</th>\n", + " <td>95.800000</td>\n", + " <td>NaN</td>\n", + " <td>34.800000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>1.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34.8</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44241</th>\n", + " <td>NaN</td>\n", + " <td>97.670000</td>\n", + " <td>NaN</td>\n", + " <td>37.420725</td>\n", + " <td>NaN</td>\n", + " <td>0.668415</td>\n", + " <td>NaN</td>\n", + " <td>0.378023</td>\n", + " <td>0.0</td>\n", + " <td>10.0</td>\n", + " <td>0.0</td>\n", + " <td>193.0</td>\n", + " <td>NaN</td>\n", + " <td>98.699997</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44242</th>\n", + " <td>NaN</td>\n", + " <td>98.980953</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.933605</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.0</td>\n", + " <td>21.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>NaN</td>\n", + " <td>99.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44243</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>35.750000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>0.919241</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>2.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>35.099998</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44244</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>36.176191</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.159700</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>21.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>34.700001</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44245</th>\n", + " <td>98.655000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>1.147297</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>20.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>97.8</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>44246 rows × 16 columns</p>\n", + "</div>" + ], + "text/plain": [ + " temperature body_degF_223761_MEAN temperature body_degF_678_MEAN \\\n", + "0 98.537500 NaN \n", + "1 97.166667 NaN \n", + "2 NaN 97.533334 \n", + "3 NaN 98.591667 \n", + "4 98.100000 NaN \n", + "5 98.550000 NaN \n", + "6 98.380000 NaN \n", + "7 NaN 100.649998 \n", + "8 97.975000 NaN \n", + "9 96.050000 NaN \n", + "10 NaN 98.536364 \n", + "11 NaN NaN \n", + "12 99.466667 NaN \n", + "13 NaN 99.099998 \n", + "14 NaN 95.300003 \n", + "15 98.500000 NaN \n", + "16 100.772222 NaN \n", + "17 NaN NaN \n", + "18 99.345455 NaN \n", + "19 NaN 98.800003 \n", + "20 98.312500 NaN \n", + "21 97.760000 NaN \n", + "22 NaN 98.445455 \n", + "23 NaN NaN \n", + "24 NaN NaN \n", + "25 NaN 97.320000 \n", + "26 NaN 96.700000 \n", + "27 NaN 96.920000 \n", + "28 NaN NaN \n", + "29 96.525000 NaN \n", + "... ... ... \n", + "44216 NaN 98.302703 \n", + "44217 98.475000 NaN \n", + "44218 96.275000 NaN \n", + "44219 NaN 97.800003 \n", + "44220 NaN 95.740001 \n", + "44221 NaN 97.920000 \n", + "44222 99.240000 NaN \n", + "44223 98.450000 NaN \n", + "44224 NaN 98.130000 \n", + "44225 NaN 97.900002 \n", + "44226 99.753333 NaN \n", + "44227 NaN 98.071875 \n", + "44228 NaN 100.526316 \n", + "44229 97.580000 NaN \n", + "44230 NaN NaN \n", + "44231 NaN NaN \n", + "44232 98.484375 NaN \n", + "44233 NaN 100.278462 \n", + "44234 NaN NaN \n", + "44235 NaN 97.074999 \n", + "44236 97.977778 NaN \n", + "44237 NaN 97.485713 \n", + "44238 NaN 97.264285 \n", + "44239 NaN 95.400002 \n", + "44240 95.800000 NaN \n", + "44241 NaN 97.670000 \n", + "44242 NaN 98.980953 \n", + "44243 NaN NaN \n", + "44244 NaN NaN \n", + "44245 98.655000 NaN \n", + "\n", + " temperature body_degC_223762_MEAN temperature body_degC_676_MEAN \\\n", + "0 NaN NaN \n", + "1 NaN NaN \n", + "2 NaN NaN \n", + "3 NaN NaN \n", + "4 NaN NaN \n", + "5 NaN NaN \n", + "6 36.511765 NaN \n", + "7 NaN NaN \n", + "8 NaN NaN \n", + "9 NaN NaN \n", + "10 NaN NaN \n", + "11 36.378571 NaN \n", + "12 NaN NaN \n", + "13 NaN 36.766037 \n", + "14 NaN NaN \n", + "15 NaN NaN \n", + "16 37.719512 NaN \n", + "17 NaN 37.193750 \n", + "18 NaN NaN \n", + "19 NaN NaN \n", + "20 NaN NaN \n", + "21 NaN NaN \n", + "22 NaN NaN \n", + "23 34.990909 NaN \n", + "24 NaN 36.799999 \n", + "25 NaN NaN \n", + "26 NaN NaN \n", + "27 NaN NaN \n", + "28 NaN 36.847368 \n", + "29 NaN NaN \n", + "... ... ... \n", + "44216 NaN 37.021739 \n", + "44217 NaN NaN \n", + "44218 NaN NaN \n", + "44219 NaN NaN \n", + "44220 NaN NaN \n", + "44221 NaN NaN \n", + "44222 NaN NaN \n", + "44223 NaN NaN \n", + "44224 NaN NaN \n", + "44225 NaN NaN \n", + "44226 NaN NaN \n", + "44227 NaN 37.449181 \n", + "44228 NaN NaN \n", + "44229 NaN NaN \n", + "44230 NaN 37.443518 \n", + "44231 NaN 36.071429 \n", + "44232 NaN NaN \n", + "44233 NaN NaN \n", + "44234 36.173333 NaN \n", + "44235 NaN NaN \n", + "44236 NaN NaN \n", + "44237 NaN NaN \n", + "44238 NaN NaN \n", + "44239 NaN NaN \n", + "44240 34.800000 NaN \n", + "44241 NaN 37.420725 \n", + "44242 NaN NaN \n", + "44243 NaN 35.750000 \n", + "44244 NaN 36.176191 \n", + "44245 NaN NaN \n", + "\n", + " temperature body_degF_223761_STD temperature body_degF_678_STD \\\n", + "0 1.064945 NaN \n", + "1 1.167619 NaN \n", + "2 NaN 0.607729 \n", + "3 NaN 1.466263 \n", + "4 0.458258 NaN \n", + "5 1.036822 NaN \n", + "6 0.641872 NaN \n", + "7 NaN 0.777816 \n", + "8 0.875032 NaN \n", + "9 0.777817 NaN \n", + "10 NaN 0.492489 \n", + "11 NaN NaN \n", + "12 1.495650 NaN \n", + "13 NaN NaN \n", + "14 NaN NaN \n", + "15 0.141421 NaN \n", + "16 1.075287 NaN \n", + "17 NaN NaN \n", + "18 0.864975 NaN \n", + "19 NaN NaN \n", + "20 1.022986 NaN \n", + "21 0.585662 NaN \n", + "22 NaN 1.849254 \n", + "23 NaN NaN \n", + "24 NaN NaN \n", + "25 NaN 0.277491 \n", + "26 NaN 0.754119 \n", + "27 NaN 1.787487 \n", + "28 NaN NaN \n", + "29 0.450000 NaN \n", + "... ... ... \n", + "44216 NaN 1.047082 \n", + "44217 1.081280 NaN \n", + "44218 0.420034 NaN \n", + "44219 NaN NaN \n", + "44220 NaN 1.021275 \n", + "44221 NaN 0.672309 \n", + "44222 0.512835 NaN \n", + "44223 0.070711 NaN \n", + "44224 NaN 0.531351 \n", + "44225 NaN 0.199997 \n", + "44226 0.765195 NaN \n", + "44227 NaN 0.944674 \n", + "44228 NaN 1.175605 \n", + "44229 0.740570 NaN \n", + "44230 NaN NaN \n", + "44231 NaN NaN \n", + "44232 1.070456 NaN \n", + "44233 NaN 1.300803 \n", + "44234 NaN NaN \n", + "44235 NaN 1.056330 \n", + "44236 1.032930 NaN \n", + "44237 NaN 0.977118 \n", + "44238 NaN 0.759157 \n", + "44239 NaN 0.565688 \n", + "44240 NaN NaN \n", + "44241 NaN 0.668415 \n", + "44242 NaN 0.933605 \n", + "44243 NaN NaN \n", + "44244 NaN NaN \n", + "44245 1.147297 NaN \n", + "\n", + " temperature body_degC_223762_STD temperature body_degC_676_STD \\\n", + "0 NaN NaN \n", + "1 NaN NaN \n", + "2 NaN NaN \n", + "3 NaN NaN \n", + "4 NaN NaN \n", + "5 NaN NaN \n", + "6 0.790767 NaN \n", + "7 NaN NaN \n", + "8 NaN NaN \n", + "9 NaN NaN \n", + "10 NaN NaN \n", + "11 0.260705 NaN \n", + "12 NaN NaN \n", + "13 NaN 0.374646 \n", + "14 NaN NaN \n", + "15 NaN NaN \n", + "16 0.281265 NaN \n", + "17 NaN 0.401560 \n", + "18 NaN NaN \n", + "19 NaN NaN \n", + "20 NaN NaN \n", + "21 NaN NaN \n", + "22 NaN NaN \n", + "23 4.190574 NaN \n", + "24 NaN NaN \n", + "25 NaN NaN \n", + "26 NaN NaN \n", + "27 NaN NaN \n", + "28 NaN 0.300681 \n", + "29 NaN NaN \n", + "... ... ... \n", + "44216 NaN 0.997311 \n", + "44217 NaN NaN \n", + "44218 NaN NaN \n", + "44219 NaN NaN \n", + "44220 NaN NaN \n", + "44221 NaN NaN \n", + "44222 NaN NaN \n", + "44223 NaN NaN \n", + "44224 NaN NaN \n", + "44225 NaN NaN \n", + "44226 NaN NaN \n", + "44227 NaN 0.920982 \n", + "44228 NaN NaN \n", + "44229 NaN NaN \n", + "44230 NaN 0.332443 \n", + "44231 NaN 0.239964 \n", + "44232 NaN NaN \n", + "44233 NaN NaN \n", + "44234 0.688131 NaN \n", + "44235 NaN NaN \n", + "44236 NaN NaN \n", + "44237 NaN NaN \n", + "44238 NaN NaN \n", + "44239 NaN NaN \n", + "44240 NaN NaN \n", + "44241 NaN 0.378023 \n", + "44242 NaN NaN \n", + "44243 NaN 0.919241 \n", + "44244 NaN 1.159700 \n", + "44245 NaN NaN \n", + "\n", + " temperature body_degF_223761_COUNT temperature body_degF_678_COUNT \\\n", + "0 8.0 0.0 \n", + "1 3.0 0.0 \n", + "2 0.0 21.0 \n", + "3 0.0 12.0 \n", + "4 3.0 0.0 \n", + "5 6.0 0.0 \n", + "6 5.0 0.0 \n", + "7 0.0 2.0 \n", + "8 12.0 0.0 \n", + "9 2.0 0.0 \n", + "10 0.0 11.0 \n", + "11 0.0 0.0 \n", + "12 12.0 0.0 \n", + "13 0.0 1.0 \n", + "14 0.0 1.0 \n", + "15 2.0 0.0 \n", + "16 18.0 0.0 \n", + "17 0.0 0.0 \n", + "18 33.0 0.0 \n", + "19 0.0 1.0 \n", + "20 16.0 0.0 \n", + "21 5.0 0.0 \n", + "22 0.0 22.0 \n", + "23 0.0 0.0 \n", + "24 0.0 0.0 \n", + "25 0.0 5.0 \n", + "26 0.0 24.0 \n", + "27 0.0 10.0 \n", + "28 0.0 0.0 \n", + "29 4.0 0.0 \n", + "... ... ... \n", + "44216 0.0 37.0 \n", + "44217 4.0 0.0 \n", + "44218 8.0 0.0 \n", + "44219 0.0 1.0 \n", + "44220 0.0 5.0 \n", + "44221 0.0 5.0 \n", + "44222 5.0 0.0 \n", + "44223 2.0 0.0 \n", + "44224 0.0 10.0 \n", + "44225 0.0 4.0 \n", + "44226 15.0 0.0 \n", + "44227 0.0 32.0 \n", + "44228 0.0 19.0 \n", + "44229 10.0 0.0 \n", + "44230 0.0 0.0 \n", + "44231 0.0 0.0 \n", + "44232 32.0 0.0 \n", + "44233 0.0 130.0 \n", + "44234 0.0 0.0 \n", + "44235 0.0 4.0 \n", + "44236 9.0 0.0 \n", + "44237 0.0 7.0 \n", + "44238 0.0 14.0 \n", + "44239 0.0 2.0 \n", + "44240 1.0 0.0 \n", + "44241 0.0 10.0 \n", + "44242 0.0 21.0 \n", + "44243 0.0 0.0 \n", + "44244 0.0 0.0 \n", + "44245 20.0 0.0 \n", + "\n", + " temperature body_degC_223762_COUNT temperature body_degC_676_COUNT \\\n", + "0 0.0 0.0 \n", + "1 0.0 0.0 \n", + "2 0.0 0.0 \n", + "3 0.0 0.0 \n", + "4 0.0 0.0 \n", + "5 0.0 0.0 \n", + "6 34.0 0.0 \n", + "7 0.0 0.0 \n", + "8 0.0 0.0 \n", + "9 0.0 0.0 \n", + "10 0.0 0.0 \n", + "11 14.0 0.0 \n", + "12 0.0 0.0 \n", + "13 0.0 106.0 \n", + "14 0.0 0.0 \n", + "15 0.0 0.0 \n", + "16 41.0 0.0 \n", + "17 0.0 32.0 \n", + "18 0.0 0.0 \n", + "19 0.0 0.0 \n", + "20 0.0 0.0 \n", + "21 0.0 0.0 \n", + "22 0.0 0.0 \n", + "23 11.0 0.0 \n", + "24 0.0 1.0 \n", + "25 0.0 0.0 \n", + "26 0.0 0.0 \n", + "27 0.0 0.0 \n", + "28 0.0 19.0 \n", + "29 0.0 0.0 \n", + "... ... ... \n", + "44216 0.0 46.0 \n", + "44217 0.0 0.0 \n", + "44218 0.0 0.0 \n", + "44219 0.0 0.0 \n", + "44220 0.0 0.0 \n", + "44221 0.0 0.0 \n", + "44222 0.0 0.0 \n", + "44223 0.0 0.0 \n", + "44224 0.0 0.0 \n", + "44225 0.0 0.0 \n", + "44226 0.0 0.0 \n", + "44227 0.0 61.0 \n", + "44228 0.0 0.0 \n", + "44229 0.0 0.0 \n", + "44230 0.0 108.0 \n", + "44231 0.0 14.0 \n", + "44232 0.0 0.0 \n", + "44233 0.0 0.0 \n", + "44234 15.0 0.0 \n", + "44235 0.0 0.0 \n", + "44236 0.0 0.0 \n", + "44237 0.0 0.0 \n", + "44238 0.0 0.0 \n", + "44239 0.0 0.0 \n", + "44240 1.0 0.0 \n", + "44241 0.0 193.0 \n", + "44242 0.0 0.0 \n", + "44243 0.0 2.0 \n", + "44244 0.0 21.0 \n", + "44245 0.0 0.0 \n", + "\n", + " temperature body_degF_223761_LAST temperature body_degF_678_LAST \\\n", + "0 98.0 NaN \n", + "1 95.9 NaN \n", + "2 NaN 97.000000 \n", + "3 NaN 95.699997 \n", + "4 98.6 NaN \n", + "5 100.2 NaN \n", + "6 NaN NaN \n", + "7 NaN 101.199997 \n", + "8 97.4 NaN \n", + "9 96.6 NaN \n", + "10 NaN 98.500000 \n", + "11 NaN NaN \n", + "12 98.8 NaN \n", + "13 NaN NaN \n", + "14 NaN 95.300003 \n", + "15 98.6 NaN \n", + "16 NaN NaN \n", + "17 NaN NaN \n", + "18 98.6 NaN \n", + "19 NaN 98.800003 \n", + "20 97.6 NaN \n", + "21 97.8 NaN \n", + "22 NaN 97.800003 \n", + "23 NaN NaN \n", + "24 NaN NaN \n", + "25 NaN 97.199997 \n", + "26 NaN 97.000000 \n", + "27 NaN 94.000000 \n", + "28 NaN NaN \n", + "29 96.9 NaN \n", + "... ... ... \n", + "44216 NaN 96.000000 \n", + "44217 97.1 NaN \n", + "44218 96.3 NaN \n", + "44219 NaN 97.800003 \n", + "44220 NaN 94.099998 \n", + "44221 NaN 97.099998 \n", + "44222 99.8 NaN \n", + "44223 98.4 NaN \n", + "44224 NaN 97.800003 \n", + "44225 NaN 97.800003 \n", + "44226 98.7 NaN \n", + "44227 NaN NaN \n", + "44228 NaN 98.000000 \n", + "44229 96.9 NaN \n", + "44230 NaN NaN \n", + "44231 NaN NaN \n", + "44232 100.0 NaN \n", + "44233 NaN 97.900002 \n", + "44234 NaN NaN \n", + "44235 NaN 95.599998 \n", + "44236 98.4 NaN \n", + "44237 NaN 95.900002 \n", + "44238 NaN 96.599998 \n", + "44239 NaN 95.000000 \n", + "44240 NaN NaN \n", + "44241 NaN 98.699997 \n", + "44242 NaN 99.400002 \n", + "44243 NaN NaN \n", + "44244 NaN NaN \n", + "44245 97.8 NaN \n", + "\n", + " temperature body_degC_223762_LAST temperature body_degC_676_LAST \n", + "0 NaN NaN \n", + "1 NaN NaN \n", + "2 NaN NaN \n", + "3 NaN NaN \n", + "4 NaN NaN \n", + "5 NaN NaN \n", + "6 34.5 NaN \n", + "7 NaN NaN \n", + "8 NaN NaN \n", + "9 NaN NaN \n", + "10 NaN NaN \n", + "11 36.6 NaN \n", + "12 NaN NaN \n", + "13 NaN 36.599998 \n", + "14 NaN NaN \n", + "15 NaN NaN \n", + "16 37.5 NaN \n", + "17 NaN 36.799999 \n", + "18 NaN NaN \n", + "19 NaN NaN \n", + "20 NaN NaN \n", + "21 NaN NaN \n", + "22 NaN NaN \n", + "23 28.4 NaN \n", + "24 NaN 36.799999 \n", + "25 NaN NaN \n", + "26 NaN NaN \n", + "27 NaN NaN \n", + "28 NaN 36.200001 \n", + "29 NaN NaN \n", + "... ... ... \n", + "44216 NaN NaN \n", + "44217 NaN NaN \n", + "44218 NaN NaN \n", + "44219 NaN NaN \n", + "44220 NaN NaN \n", + "44221 NaN NaN \n", + "44222 NaN NaN \n", + "44223 NaN NaN \n", + "44224 NaN NaN \n", + "44225 NaN NaN \n", + "44226 NaN NaN \n", + "44227 NaN 34.500000 \n", + "44228 NaN NaN \n", + "44229 NaN NaN \n", + "44230 NaN 37.299999 \n", + "44231 NaN 35.599998 \n", + "44232 NaN NaN \n", + "44233 NaN NaN \n", + "44234 35.0 NaN \n", + "44235 NaN NaN \n", + "44236 NaN NaN \n", + "44237 NaN NaN \n", + "44238 NaN NaN \n", + "44239 NaN NaN \n", + "44240 34.8 NaN \n", + "44241 NaN NaN \n", + "44242 NaN NaN \n", + "44243 NaN 35.099998 \n", + "44244 NaN 34.700001 \n", + "44245 NaN NaN \n", + "\n", + "[44246 rows x 16 columns]" + ] + }, + "execution_count": 233, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "feature_df" + ] + }, + { + "cell_type": "code", + "execution_count": 120, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "test_mapper_pipeline = Pipeline([\n", + " ('ft_mapper',mapped_ft)\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": 121, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>temperature body_known_qn_degF_223761_MEAN</th>\n", + " <th>temperature body_known_qn_degF_678_MEAN</th>\n", + " <th>temperature body_known_qn_degF_223762(degC)_MEAN</th>\n", + " <th>temperature body_known_qn_degF_676(degC)_MEAN</th>\n", + " <th>temperature body_known_qn_degF_223761_STD</th>\n", + " <th>temperature body_known_qn_degF_678_STD</th>\n", + " <th>temperature body_known_qn_degF_223762(degC)_STD</th>\n", + " <th>temperature body_known_qn_degF_676(degC)_STD</th>\n", + " <th>temperature body_known_qn_degF_223761_COUNT</th>\n", + " <th>temperature body_known_qn_degF_678_COUNT</th>\n", + " <th>temperature body_known_qn_degF_223762(degC)_COUNT</th>\n", + " <th>temperature body_known_qn_degF_676(degC)_COUNT</th>\n", + " <th>temperature body_known_qn_degF_223761_LAST</th>\n", + " <th>temperature body_known_qn_degF_678_LAST</th>\n", + " <th>temperature body_known_qn_degF_223762(degC)_LAST</th>\n", + " <th>temperature body_known_qn_degF_676(degC)_LAST</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>98.537500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.537500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.537500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.537500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>97.166667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.166667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.166667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.166667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>NaN</td>\n", + " <td>97.533334</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.533334</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.533334</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.533334</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>NaN</td>\n", + " <td>98.591667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.591667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.591667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.591667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>98.100000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.100000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.100000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.100000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>5</th>\n", + " <td>98.550000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.550000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.550000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.550000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>6</th>\n", + " <td>98.380000</td>\n", + " <td>NaN</td>\n", + " <td>97.721177</td>\n", + " <td>NaN</td>\n", + " <td>98.380000</td>\n", + " <td>NaN</td>\n", + " <td>97.721177</td>\n", + " <td>NaN</td>\n", + " <td>98.380000</td>\n", + " <td>NaN</td>\n", + " <td>97.721177</td>\n", + " <td>NaN</td>\n", + " <td>98.380000</td>\n", + " <td>NaN</td>\n", + " <td>97.721177</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>7</th>\n", + " <td>NaN</td>\n", + " <td>100.649998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.649998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.649998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.649998</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>8</th>\n", + " <td>97.975000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.975000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.975000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.975000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>9</th>\n", + " <td>96.050000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.050000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.050000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.050000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>10</th>\n", + " <td>NaN</td>\n", + " <td>98.536364</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.536364</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.536364</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.536364</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>11</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.481429</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.481429</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.481429</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.481429</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>12</th>\n", + " <td>99.466667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.466667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.466667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.466667</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>13</th>\n", + " <td>NaN</td>\n", + " <td>99.099998</td>\n", + " <td>NaN</td>\n", + " <td>98.178868</td>\n", + " <td>NaN</td>\n", + " <td>99.099998</td>\n", + " <td>NaN</td>\n", + " <td>98.178868</td>\n", + " <td>NaN</td>\n", + " <td>99.099998</td>\n", + " <td>NaN</td>\n", + " <td>98.178868</td>\n", + " <td>NaN</td>\n", + " <td>99.099998</td>\n", + " <td>NaN</td>\n", + " <td>98.178868</td>\n", + " </tr>\n", + " <tr>\n", + " <th>14</th>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.300003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>15</th>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.500000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>16</th>\n", + " <td>100.772222</td>\n", + " <td>NaN</td>\n", + " <td>99.895122</td>\n", + " <td>NaN</td>\n", + " <td>100.772222</td>\n", + " <td>NaN</td>\n", + " <td>99.895122</td>\n", + " <td>NaN</td>\n", + " <td>100.772222</td>\n", + " <td>NaN</td>\n", + " <td>99.895122</td>\n", + " <td>NaN</td>\n", + " <td>100.772222</td>\n", + " <td>NaN</td>\n", + " <td>99.895122</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>17</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.948750</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.948750</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.948750</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.948750</td>\n", + " </tr>\n", + " <tr>\n", + " <th>18</th>\n", + " <td>99.345455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.345455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.345455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.345455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>19</th>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>20</th>\n", + " <td>98.312500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.312500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.312500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.312500</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>21</th>\n", + " <td>97.760000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.760000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.760000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.760000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>22</th>\n", + " <td>NaN</td>\n", + " <td>98.445455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.445455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.445455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.445455</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>23</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>94.983637</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>94.983637</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>94.983637</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>94.983637</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>24</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.239999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.239999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.239999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.239999</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25</th>\n", + " <td>NaN</td>\n", + " <td>97.320000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.320000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.320000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.320000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>26</th>\n", + " <td>NaN</td>\n", + " <td>96.700000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.700000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.700000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.700000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>27</th>\n", + " <td>NaN</td>\n", + " <td>96.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>28</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.325263</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.325263</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.325263</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.325263</td>\n", + " </tr>\n", + " <tr>\n", + " <th>29</th>\n", + " <td>96.525000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.525000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.525000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.525000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44216</th>\n", + " <td>NaN</td>\n", + " <td>98.302703</td>\n", + " <td>NaN</td>\n", + " <td>98.639131</td>\n", + " <td>NaN</td>\n", + " <td>98.302703</td>\n", + " <td>NaN</td>\n", + " <td>98.639131</td>\n", + " <td>NaN</td>\n", + " <td>98.302703</td>\n", + " <td>NaN</td>\n", + " <td>98.639131</td>\n", + " <td>NaN</td>\n", + " <td>98.302703</td>\n", + " <td>NaN</td>\n", + " <td>98.639131</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44217</th>\n", + " <td>98.475000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.475000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.475000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.475000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44218</th>\n", + " <td>96.275000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.275000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.275000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.275000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44219</th>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.800003</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44220</th>\n", + " <td>NaN</td>\n", + " <td>95.740001</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.740001</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.740001</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.740001</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44221</th>\n", + " <td>NaN</td>\n", + " <td>97.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.920000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44222</th>\n", + " <td>99.240000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.240000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.240000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.240000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44223</th>\n", + " <td>98.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.450000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44224</th>\n", + " <td>NaN</td>\n", + " <td>98.130000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.130000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.130000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.130000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44225</th>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.900002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44226</th>\n", + " <td>99.753333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.753333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.753333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.753333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44227</th>\n", + " <td>NaN</td>\n", + " <td>98.071875</td>\n", + " <td>NaN</td>\n", + " <td>99.408525</td>\n", + " <td>NaN</td>\n", + " <td>98.071875</td>\n", + " <td>NaN</td>\n", + " <td>99.408525</td>\n", + " <td>NaN</td>\n", + " <td>98.071875</td>\n", + " <td>NaN</td>\n", + " <td>99.408525</td>\n", + " <td>NaN</td>\n", + " <td>98.071875</td>\n", + " <td>NaN</td>\n", + " <td>99.408525</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44228</th>\n", + " <td>NaN</td>\n", + " <td>100.526316</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.526316</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.526316</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.526316</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44229</th>\n", + " <td>97.580000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.580000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.580000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.580000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44230</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.398333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.398333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.398333</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>99.398333</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44231</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.928572</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.928572</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.928572</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.928572</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44232</th>\n", + " <td>98.484375</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.484375</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.484375</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.484375</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44233</th>\n", + " <td>NaN</td>\n", + " <td>100.278462</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.278462</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.278462</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>100.278462</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44234</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.112000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.112000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.112000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.112000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44235</th>\n", + " <td>NaN</td>\n", + " <td>97.074999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.074999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.074999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.074999</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44236</th>\n", + " <td>97.977778</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.977778</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.977778</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.977778</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44237</th>\n", + " <td>NaN</td>\n", + " <td>97.485713</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.485713</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.485713</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.485713</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44238</th>\n", + " <td>NaN</td>\n", + " <td>97.264285</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.264285</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.264285</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.264285</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44239</th>\n", + " <td>NaN</td>\n", + " <td>95.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>95.400002</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44240</th>\n", + " <td>95.800000</td>\n", + " <td>NaN</td>\n", + " <td>94.640000</td>\n", + " <td>NaN</td>\n", + " <td>95.800000</td>\n", + " <td>NaN</td>\n", + " <td>94.640000</td>\n", + " <td>NaN</td>\n", + " <td>95.800000</td>\n", + " <td>NaN</td>\n", + " <td>94.640000</td>\n", + " <td>NaN</td>\n", + " <td>95.800000</td>\n", + " <td>NaN</td>\n", + " <td>94.640000</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44241</th>\n", + " <td>NaN</td>\n", + " <td>97.670000</td>\n", + " <td>NaN</td>\n", + " <td>99.357306</td>\n", + " <td>NaN</td>\n", + " <td>97.670000</td>\n", + " <td>NaN</td>\n", + " <td>99.357306</td>\n", + " <td>NaN</td>\n", + " <td>97.670000</td>\n", + " <td>NaN</td>\n", + " <td>99.357306</td>\n", + " <td>NaN</td>\n", + " <td>97.670000</td>\n", + " <td>NaN</td>\n", + " <td>99.357306</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44242</th>\n", + " <td>NaN</td>\n", + " <td>98.980953</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.980953</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.980953</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.980953</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44243</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.350000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.350000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.350000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>96.350000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44244</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.117143</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.117143</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.117143</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>97.117143</td>\n", + " </tr>\n", + " <tr>\n", + " <th>44245</th>\n", + " <td>98.655000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.655000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.655000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>98.655000</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>44246 rows × 16 columns</p>\n", + "</div>" + ], + "text/plain": [ + " temperature body_known_qn_degF_223761_MEAN \\\n", + "0 98.537500 \n", + "1 97.166667 \n", + "2 NaN \n", + "3 NaN \n", + "4 98.100000 \n", + "5 98.550000 \n", + "6 98.380000 \n", + "7 NaN \n", + "8 97.975000 \n", + "9 96.050000 \n", + "10 NaN \n", + "11 NaN \n", + "12 99.466667 \n", + "13 NaN \n", + "14 NaN \n", + "15 98.500000 \n", + "16 100.772222 \n", + "17 NaN \n", + "18 99.345455 \n", + "19 NaN \n", + "20 98.312500 \n", + "21 97.760000 \n", + "22 NaN \n", + "23 NaN \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 96.525000 \n", + "... ... \n", + "44216 NaN \n", + "44217 98.475000 \n", + "44218 96.275000 \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 99.240000 \n", + "44223 98.450000 \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 99.753333 \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 97.580000 \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 98.484375 \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 97.977778 \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 95.800000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 98.655000 \n", + "\n", + " temperature body_known_qn_degF_678_MEAN \\\n", + "0 NaN \n", + "1 NaN \n", + "2 97.533334 \n", + "3 98.591667 \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 100.649998 \n", + "8 NaN \n", + "9 NaN \n", + "10 98.536364 \n", + "11 NaN \n", + "12 NaN \n", + "13 99.099998 \n", + "14 95.300003 \n", + "15 NaN \n", + "16 NaN \n", + "17 NaN \n", + "18 NaN \n", + "19 98.800003 \n", + "20 NaN \n", + "21 NaN \n", + "22 98.445455 \n", + "23 NaN \n", + "24 NaN \n", + "25 97.320000 \n", + "26 96.700000 \n", + "27 96.920000 \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 98.302703 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 97.800003 \n", + "44220 95.740001 \n", + "44221 97.920000 \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 98.130000 \n", + "44225 97.900002 \n", + "44226 NaN \n", + "44227 98.071875 \n", + "44228 100.526316 \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 100.278462 \n", + "44234 NaN \n", + "44235 97.074999 \n", + "44236 NaN \n", + "44237 97.485713 \n", + "44238 97.264285 \n", + "44239 95.400002 \n", + "44240 NaN \n", + "44241 97.670000 \n", + "44242 98.980953 \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223762(degC)_MEAN \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 97.721177 \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 97.481429 \n", + "12 NaN \n", + "13 NaN \n", + "14 NaN \n", + "15 NaN \n", + "16 99.895122 \n", + "17 NaN \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 94.983637 \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 NaN \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 97.112000 \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 94.640000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_676(degC)_MEAN \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 NaN \n", + "12 NaN \n", + "13 98.178868 \n", + "14 NaN \n", + "15 NaN \n", + "16 NaN \n", + "17 98.948750 \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 NaN \n", + "24 98.239999 \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 98.325263 \n", + "29 NaN \n", + "... ... \n", + "44216 98.639131 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 99.408525 \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 99.398333 \n", + "44231 96.928572 \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 NaN \n", + "44241 99.357306 \n", + "44242 NaN \n", + "44243 96.350000 \n", + "44244 97.117143 \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223761_STD \\\n", + "0 98.537500 \n", + "1 97.166667 \n", + "2 NaN \n", + "3 NaN \n", + "4 98.100000 \n", + "5 98.550000 \n", + "6 98.380000 \n", + "7 NaN \n", + "8 97.975000 \n", + "9 96.050000 \n", + "10 NaN \n", + "11 NaN \n", + "12 99.466667 \n", + "13 NaN \n", + "14 NaN \n", + "15 98.500000 \n", + "16 100.772222 \n", + "17 NaN \n", + "18 99.345455 \n", + "19 NaN \n", + "20 98.312500 \n", + "21 97.760000 \n", + "22 NaN \n", + "23 NaN \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 96.525000 \n", + "... ... \n", + "44216 NaN \n", + "44217 98.475000 \n", + "44218 96.275000 \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 99.240000 \n", + "44223 98.450000 \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 99.753333 \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 97.580000 \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 98.484375 \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 97.977778 \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 95.800000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 98.655000 \n", + "\n", + " temperature body_known_qn_degF_678_STD \\\n", + "0 NaN \n", + "1 NaN \n", + "2 97.533334 \n", + "3 98.591667 \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 100.649998 \n", + "8 NaN \n", + "9 NaN \n", + "10 98.536364 \n", + "11 NaN \n", + "12 NaN \n", + "13 99.099998 \n", + "14 95.300003 \n", + "15 NaN \n", + "16 NaN \n", + "17 NaN \n", + "18 NaN \n", + "19 98.800003 \n", + "20 NaN \n", + "21 NaN \n", + "22 98.445455 \n", + "23 NaN \n", + "24 NaN \n", + "25 97.320000 \n", + "26 96.700000 \n", + "27 96.920000 \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 98.302703 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 97.800003 \n", + "44220 95.740001 \n", + "44221 97.920000 \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 98.130000 \n", + "44225 97.900002 \n", + "44226 NaN \n", + "44227 98.071875 \n", + "44228 100.526316 \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 100.278462 \n", + "44234 NaN \n", + "44235 97.074999 \n", + "44236 NaN \n", + "44237 97.485713 \n", + "44238 97.264285 \n", + "44239 95.400002 \n", + "44240 NaN \n", + "44241 97.670000 \n", + "44242 98.980953 \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223762(degC)_STD \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 97.721177 \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 97.481429 \n", + "12 NaN \n", + "13 NaN \n", + "14 NaN \n", + "15 NaN \n", + "16 99.895122 \n", + "17 NaN \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 94.983637 \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 NaN \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 97.112000 \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 94.640000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_676(degC)_STD \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 NaN \n", + "12 NaN \n", + "13 98.178868 \n", + "14 NaN \n", + "15 NaN \n", + "16 NaN \n", + "17 98.948750 \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 NaN \n", + "24 98.239999 \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 98.325263 \n", + "29 NaN \n", + "... ... \n", + "44216 98.639131 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 99.408525 \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 99.398333 \n", + "44231 96.928572 \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 NaN \n", + "44241 99.357306 \n", + "44242 NaN \n", + "44243 96.350000 \n", + "44244 97.117143 \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223761_COUNT \\\n", + "0 98.537500 \n", + "1 97.166667 \n", + "2 NaN \n", + "3 NaN \n", + "4 98.100000 \n", + "5 98.550000 \n", + "6 98.380000 \n", + "7 NaN \n", + "8 97.975000 \n", + "9 96.050000 \n", + "10 NaN \n", + "11 NaN \n", + "12 99.466667 \n", + "13 NaN \n", + "14 NaN \n", + "15 98.500000 \n", + "16 100.772222 \n", + "17 NaN \n", + "18 99.345455 \n", + "19 NaN \n", + "20 98.312500 \n", + "21 97.760000 \n", + "22 NaN \n", + "23 NaN \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 96.525000 \n", + "... ... \n", + "44216 NaN \n", + "44217 98.475000 \n", + "44218 96.275000 \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 99.240000 \n", + "44223 98.450000 \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 99.753333 \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 97.580000 \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 98.484375 \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 97.977778 \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 95.800000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 98.655000 \n", + "\n", + " temperature body_known_qn_degF_678_COUNT \\\n", + "0 NaN \n", + "1 NaN \n", + "2 97.533334 \n", + "3 98.591667 \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 100.649998 \n", + "8 NaN \n", + "9 NaN \n", + "10 98.536364 \n", + "11 NaN \n", + "12 NaN \n", + "13 99.099998 \n", + "14 95.300003 \n", + "15 NaN \n", + "16 NaN \n", + "17 NaN \n", + "18 NaN \n", + "19 98.800003 \n", + "20 NaN \n", + "21 NaN \n", + "22 98.445455 \n", + "23 NaN \n", + "24 NaN \n", + "25 97.320000 \n", + "26 96.700000 \n", + "27 96.920000 \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 98.302703 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 97.800003 \n", + "44220 95.740001 \n", + "44221 97.920000 \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 98.130000 \n", + "44225 97.900002 \n", + "44226 NaN \n", + "44227 98.071875 \n", + "44228 100.526316 \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 100.278462 \n", + "44234 NaN \n", + "44235 97.074999 \n", + "44236 NaN \n", + "44237 97.485713 \n", + "44238 97.264285 \n", + "44239 95.400002 \n", + "44240 NaN \n", + "44241 97.670000 \n", + "44242 98.980953 \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223762(degC)_COUNT \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 97.721177 \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 97.481429 \n", + "12 NaN \n", + "13 NaN \n", + "14 NaN \n", + "15 NaN \n", + "16 99.895122 \n", + "17 NaN \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 94.983637 \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 NaN \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 97.112000 \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 94.640000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_676(degC)_COUNT \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 NaN \n", + "12 NaN \n", + "13 98.178868 \n", + "14 NaN \n", + "15 NaN \n", + "16 NaN \n", + "17 98.948750 \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 NaN \n", + "24 98.239999 \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 98.325263 \n", + "29 NaN \n", + "... ... \n", + "44216 98.639131 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 99.408525 \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 99.398333 \n", + "44231 96.928572 \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 NaN \n", + "44241 99.357306 \n", + "44242 NaN \n", + "44243 96.350000 \n", + "44244 97.117143 \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223761_LAST \\\n", + "0 98.537500 \n", + "1 97.166667 \n", + "2 NaN \n", + "3 NaN \n", + "4 98.100000 \n", + "5 98.550000 \n", + "6 98.380000 \n", + "7 NaN \n", + "8 97.975000 \n", + "9 96.050000 \n", + "10 NaN \n", + "11 NaN \n", + "12 99.466667 \n", + "13 NaN \n", + "14 NaN \n", + "15 98.500000 \n", + "16 100.772222 \n", + "17 NaN \n", + "18 99.345455 \n", + "19 NaN \n", + "20 98.312500 \n", + "21 97.760000 \n", + "22 NaN \n", + "23 NaN \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 96.525000 \n", + "... ... \n", + "44216 NaN \n", + "44217 98.475000 \n", + "44218 96.275000 \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 99.240000 \n", + "44223 98.450000 \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 99.753333 \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 97.580000 \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 98.484375 \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 97.977778 \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 95.800000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 98.655000 \n", + "\n", + " temperature body_known_qn_degF_678_LAST \\\n", + "0 NaN \n", + "1 NaN \n", + "2 97.533334 \n", + "3 98.591667 \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 100.649998 \n", + "8 NaN \n", + "9 NaN \n", + "10 98.536364 \n", + "11 NaN \n", + "12 NaN \n", + "13 99.099998 \n", + "14 95.300003 \n", + "15 NaN \n", + "16 NaN \n", + "17 NaN \n", + "18 NaN \n", + "19 98.800003 \n", + "20 NaN \n", + "21 NaN \n", + "22 98.445455 \n", + "23 NaN \n", + "24 NaN \n", + "25 97.320000 \n", + "26 96.700000 \n", + "27 96.920000 \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 98.302703 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 97.800003 \n", + "44220 95.740001 \n", + "44221 97.920000 \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 98.130000 \n", + "44225 97.900002 \n", + "44226 NaN \n", + "44227 98.071875 \n", + "44228 100.526316 \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 100.278462 \n", + "44234 NaN \n", + "44235 97.074999 \n", + "44236 NaN \n", + "44237 97.485713 \n", + "44238 97.264285 \n", + "44239 95.400002 \n", + "44240 NaN \n", + "44241 97.670000 \n", + "44242 98.980953 \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_223762(degC)_LAST \\\n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 97.721177 \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 97.481429 \n", + "12 NaN \n", + "13 NaN \n", + "14 NaN \n", + "15 NaN \n", + "16 99.895122 \n", + "17 NaN \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 94.983637 \n", + "24 NaN \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 NaN \n", + "29 NaN \n", + "... ... \n", + "44216 NaN \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 NaN \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 NaN \n", + "44231 NaN \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 97.112000 \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 94.640000 \n", + "44241 NaN \n", + "44242 NaN \n", + "44243 NaN \n", + "44244 NaN \n", + "44245 NaN \n", + "\n", + " temperature body_known_qn_degF_676(degC)_LAST \n", + "0 NaN \n", + "1 NaN \n", + "2 NaN \n", + "3 NaN \n", + "4 NaN \n", + "5 NaN \n", + "6 NaN \n", + "7 NaN \n", + "8 NaN \n", + "9 NaN \n", + "10 NaN \n", + "11 NaN \n", + "12 NaN \n", + "13 98.178868 \n", + "14 NaN \n", + "15 NaN \n", + "16 NaN \n", + "17 98.948750 \n", + "18 NaN \n", + "19 NaN \n", + "20 NaN \n", + "21 NaN \n", + "22 NaN \n", + "23 NaN \n", + "24 98.239999 \n", + "25 NaN \n", + "26 NaN \n", + "27 NaN \n", + "28 98.325263 \n", + "29 NaN \n", + "... ... \n", + "44216 98.639131 \n", + "44217 NaN \n", + "44218 NaN \n", + "44219 NaN \n", + "44220 NaN \n", + "44221 NaN \n", + "44222 NaN \n", + "44223 NaN \n", + "44224 NaN \n", + "44225 NaN \n", + "44226 NaN \n", + "44227 99.408525 \n", + "44228 NaN \n", + "44229 NaN \n", + "44230 99.398333 \n", + "44231 96.928572 \n", + "44232 NaN \n", + "44233 NaN \n", + "44234 NaN \n", + "44235 NaN \n", + "44236 NaN \n", + "44237 NaN \n", + "44238 NaN \n", + "44239 NaN \n", + "44240 NaN \n", + "44241 99.357306 \n", + "44242 NaN \n", + "44243 96.350000 \n", + "44244 97.117143 \n", + "44245 NaN \n", + "\n", + "[44246 rows x 16 columns]" + ] + }, + "execution_count": 121, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "test_mapper_pipeline.transform(df)" + ] + }, + { + "cell_type": "code", + "execution_count": 152, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<units.MedicalUreg at 0x31082eb8>" + ] + }, + "execution_count": 152, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ureg" + ] + }, + { + "cell_type": "code", + "execution_count": 197, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "mass = ureg.parse_units('degF')" + ] + }, + { + "cell_type": "code", + "execution_count": 198, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<UnitsContainer({'[temperature]': 1.0})>" + ] + }, + "execution_count": 198, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mass.dimensionality" + ] + }, + { + "cell_type": "code", + "execution_count": 157, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "from pint.unit import UnitsContainer" + ] + }, + { + "cell_type": "code", + "execution_count": 160, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "True" + ] + }, + "execution_count": 160, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "units.dimensionality == UnitsContainer({'[length]':3.0})" + ] + }, + { + "cell_type": "code", + "execution_count": 166, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "1e-06 kilogram" + ], + "text/latex": [ + "$1e-06\\ \\mathrm{kilogram}$" + ], + "text/plain": [ + "<Quantity(1e-06, 'kilogram')>" + ] + }, + "execution_count": 166, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "(1*units).to_base_units()" + ] + }, + { + "cell_type": "code", + "execution_count": 161, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "uc = UnitsContainer({'[length]':3.0})" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "uc.dim" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "import constants\n", + "import mimic\n", + "import utils\n", + "import pandas as pd\n", + "import icu_data_defs\n", + "import units\n", + "from sklearn.pipeline import Pipeline\n", + "import transformers\n", + "import logger\n", + "import features\n", + "import warnings\n", + "warnings.filterwarnings('ignore')" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(mimic)\n", + "reload(units)\n", + "reload(utils)\n", + "reload(transformers)\n", + "def mimic_ETL(components,data_dict,hdf5_fname,\n", + " hadm_ids=constants.ALL,\n", + " agg_func=lambda x:x.iloc[0]):\n", + " \n", + " logger.log('BEGIN ETL for {} admissions'.format(hadm_ids if hadm_ids == constants.ALL else len(hadm_ids)),new_level=True)\n", + " category_map = mimic.mimic_category_map(data_dict)\n", + " ureg = units.MedicalUreg()\n", + " extractor = mimic.mimic_extractor('config/mimic_item_map.csv',data_dict)\n", + " \n", + "\n", + " transform_pipeline = mimic.transform_pipeline()\n", + "\n", + " standard_clean_pipeline = Pipeline([\n", + " ('aggregate_same_datetime',transformers.same_index_aggregator(agg_func)),\n", + " ('split_dtype',transformers.split_dtype()),\n", + " ('standardize_columns',transformers.column_standardizer(data_dict,ureg)),\n", + " ('standardize_categories',transformers.standardize_categories(data_dict,category_map)),\n", + " ('split_bad_categories',transformers.split_bad_categories(data_dict)),\n", + " ('one_hotter',transformers.nominal_to_onehot()),\n", + " ('drop_oob_values',transformers.oob_value_remover(data_dict))\n", + " ])\n", + " \n", + "\n", + " logger.log('Extract CONTEXT...')\n", + " df_context = mimic.get_context_data(hadm_ids)\n", + " utils.save_df(df_context,hdf5_fname,'context')\n", + "\n", + " \n", + " for component in components:\n", + " logger.log(component.upper(),new_level=True)\n", + " \n", + " logger.log(\"Extracting...\",new_level=True)\n", + " df_extracted = extractor.extract_component(component,hadm_ids)\n", + " utils.save_df(df_extracted,hdf5_fname,'extracted/{}'.format(component))\n", + " logger.end_log_level()\n", + " \n", + " display(df_extracted.head())\n", + " \n", + " logger.log(\"Transforming... {}\".format(df_extracted.shape))\n", + " transform_pipeline.set_params(add_level__level_val=component)\n", + " df_transformed = transform_pipeline.transform(df_extracted)\n", + " utils.save_df(df_transformed,hdf5_fname,'transformed/{}'.format(component))\n", + "\n", + " display(df_transformed.head())\n", + "\n", + " display(df_transformed.describe())\n", + "\n", + " print utils.data_loss(df_extracted.set_index('id').value.to_frame(),df_transformed)\n", + " \n", + " logger.log(\"Cleaning... {}\".format(df_transformed.shape)) \n", + " df_cleaned = standard_clean_pipeline.transform(df_transformed)\n", + " utils.save_df(df_cleaned,hdf5_fname,'cleaned/{}'.format(component))\n", + " \n", + " display(df_cleaned.head())\n", + "\n", + " display(df_cleaned.describe())\n", + "\n", + " print utils.data_loss(df_extracted.set_index('id').value.to_frame(),df_cleaned)\n", + " \n", + " del df_cleaned,df_transformed,df_extracted\n", + " logger.end_log_level()\n", + " \n", + " \n", + " \n", + " logger.end_log()\n", + " \n", + " return\n", + " \n", + "\n", + "def mimic_features(hdf5_fname,specific_path,labels,\n", + " custom_cleaners,segmenter,feature_tuples):\n", + " \n", + " \n", + " df_all = None\n", + " \n", + " for label in labels:\n", + " df_base = utils.open_df(hdf5_fname,'cleaned/{}'.format(label))\n", + " \n", + " df_cleaned = custom_cleaners.transform(df_base)\n", + " utils.save_df(df_cleaned,hdf5_fname,'{}/cleaned/{}'.format(specific_path,label))\n", + " \n", + " if df_all is None:\n", + " df_all = df_cleaned\n", + " else:\n", + " df_all = df_all.join(df_cleaned,how='outer')\n", + " del df_cleaned\n", + " \n", + " utils.save_df(df_all,hdf5_fname,'{}/cleaned/all')\n", + " \n", + " df_segmented = segmenter.transform(df_all)\n", + " utils.save_df(df_segmented,hdf5_fname_target,'{}/segmented'.format(specific_path))\n", + " del df_all\n", + " \n", + " mapped_ft = features.make_mapper(feature_tuples,df_segmented)\n", + " df_features = mapped_ft.transform(df_segmented)\n", + " utils.save_df(df_features,hdf5_fname_target,'{}/features'.format(specific_path))\n", + " del df_segmented\n", + " \n", + " return df_features" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "def do_ETL(data_dict,components,tag,n,seed=42):\n", + " hdf5_fname = 'data/mimic_{}_{}'.format(tag,n)\n", + " hadm_ids = n if n == constants.ALL else mimic.sample_hadm_ids(n,seed) \n", + " mimic_ETL(components,data_dict,hdf5_fname,hadm_ids=hadm_ids)\n", + " return hdf5_fname" + ] + }, + { + "cell_type": "code", + "execution_count": 43, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "reload(logger)\n", + "\n", + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n", + "components = data_dict.get_panel_defintions(12).component.unique().tolist() #12 is \"simple data\"\n", + "tag = 'simple'" + ] + }, + { + "cell_type": "code", + "execution_count": 40, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-20 10:03:09) BEGIN ETL for 1000 admissions\n", + "(2017-06-20 10:03:09)>> Extract CONTEXT...\n", + "(2017-06-20 10:03:17)<< DONE (8.0s)\n", + "(2017-06-20 10:03:17)>> BLOOD PRESSURE SYSTOLIC\n", + "(2017-06-20 10:03:17)>>>> Extracting...\n", + "(2017-06-20 10:03:17)>>>>>> Extracting 14 items from chartevents\n", + "51 35823\n", + "455 26680\n", + "220179 21957\n", + "220050 15186\n", + "3313 2250\n", + "225309 1251\n", + "3315 50\n", + "3317 24\n", + "3323 21\n", + "442 19\n", + "3321 19\n", + "224167 12\n", + "227243 8\n", + "Name: itemid, dtype: int64\n", + "Empty DataFrame\n", + "Columns: [id, datetime, value, units, itemid]\n", + "Index: []\n", + "(2017-06-20 10:04:09)<<<<<< DONE (52.0s)\n", + "(2017-06-20 10:04:09)>>>>>> Combine DF\n", + "(2017-06-20 10:04:09)<<<<<< DONE (0.0s)\n", + "(2017-06-20 10:04:09)>>>>>> Clean UOM\n", + "(2017-06-20 10:04:10)<<<<<< DONE (1.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th>value</th>\n", + " <th>units</th>\n", + " <th>itemid</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>107880</td>\n", + " <td>2106-06-19 22:00:00</td>\n", + " <td>99</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>107880</td>\n", + " <td>2106-06-19 23:00:00</td>\n", + " <td>98</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>107880</td>\n", + " <td>2106-06-20 00:00:00</td>\n", + " <td>122</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>107880</td>\n", + " <td>2106-06-20 01:00:00</td>\n", + " <td>150</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>107880</td>\n", + " <td>2106-06-20 02:00:00</td>\n", + " <td>133</td>\n", + " <td>mmHg</td>\n", + " <td>51</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " id datetime value units itemid\n", + "0 107880 2106-06-19 22:00:00 99 mmHg 51\n", + "1 107880 2106-06-19 23:00:00 98 mmHg 51\n", + "2 107880 2106-06-20 00:00:00 122 mmHg 51\n", + "3 107880 2106-06-20 01:00:00 150 mmHg 51\n", + "4 107880 2106-06-20 02:00:00 133 mmHg 51" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-20 10:04:10)<<<< DONE (53.0s)\n", + "(2017-06-20 10:04:10)>>>> Transforming... (103300, 5)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>component</th>\n", + " <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th>cc/min</th>\n", + " <th colspan=\"5\" halign=\"left\">mmHg</th>\n", + " <th colspan=\"4\" halign=\"left\">cc/min</th>\n", + " <th colspan=\"3\" halign=\"left\">mmHg</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>3313</th>\n", + " <th>455</th>\n", + " <th>51</th>\n", + " <th>220179</th>\n", + " <th>442</th>\n", + " <th>220050</th>\n", + " <th>3315</th>\n", + " <th>3317</th>\n", + " <th>3321</th>\n", + " <th>3323</th>\n", + " <th>224167</th>\n", + " <th>227243</th>\n", + " <th>225309</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100304</th>\n", + " <th>2161-10-01 22:00:00</th>\n", + " <td>67</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-10-01 23:00:00</th>\n", + " <td>68</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100788</th>\n", + " <th>2120-04-10 14:00:00</th>\n", + " <td>None</td>\n", + " <td>127</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2120-04-10 15:00:00</th>\n", + " <td>None</td>\n", + " <td>127</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2120-04-10 16:00:00</th>\n", + " <td>None</td>\n", + " <td>123</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " <td>None</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "component blood pressure systolic \\\n", + "units cc/min mmHg \n", + "description 3313 455 51 220179 \n", + "id datetime \n", + "100304 2161-10-01 22:00:00 67 None None None \n", + " 2161-10-01 23:00:00 68 None None None \n", + "100788 2120-04-10 14:00:00 None 127 None None \n", + " 2120-04-10 15:00:00 None 127 None None \n", + " 2120-04-10 16:00:00 None 123 None None \n", + "\n", + "component \\\n", + "units cc/min mmHg \n", + "description 442 220050 3315 3317 3321 3323 224167 \n", + "id datetime \n", + "100304 2161-10-01 22:00:00 None None None None None None None \n", + " 2161-10-01 23:00:00 None None None None None None None \n", + "100788 2120-04-10 14:00:00 None None None None None None None \n", + " 2120-04-10 15:00:00 None None None None None None None \n", + " 2120-04-10 16:00:00 None None None None None None None \n", + "\n", + "component \n", + "units \n", + "description 227243 225309 \n", + "id datetime \n", + "100304 2161-10-01 22:00:00 None None \n", + " 2161-10-01 23:00:00 None None \n", + "100788 2120-04-10 14:00:00 None None \n", + " 2120-04-10 15:00:00 None None \n", + " 2120-04-10 16:00:00 None None " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>component</th>\n", + " <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th>cc/min</th>\n", + " <th colspan=\"5\" halign=\"left\">mmHg</th>\n", + " <th colspan=\"4\" halign=\"left\">cc/min</th>\n", + " <th colspan=\"3\" halign=\"left\">mmHg</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>3313</th>\n", + " <th>455</th>\n", + " <th>51</th>\n", + " <th>220179</th>\n", + " <th>442</th>\n", + " <th>220050</th>\n", + " <th>3315</th>\n", + " <th>3317</th>\n", + " <th>3321</th>\n", + " <th>3323</th>\n", + " <th>224167</th>\n", + " <th>227243</th>\n", + " <th>225309</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>2241</td>\n", + " <td>26480</td>\n", + " <td>35622</td>\n", + " <td>21957</td>\n", + " <td>17</td>\n", + " <td>15186</td>\n", + " <td>22</td>\n", + " <td>16</td>\n", + " <td>13</td>\n", + " <td>14</td>\n", + " <td>12</td>\n", + " <td>8</td>\n", + " <td>1251</td>\n", + " </tr>\n", + " <tr>\n", + " <th>unique</th>\n", + " <td>81</td>\n", + " <td>181</td>\n", + " <td>208</td>\n", + " <td>176</td>\n", + " <td>14</td>\n", + " <td>172</td>\n", + " <td>21</td>\n", + " <td>13</td>\n", + " <td>12</td>\n", + " <td>11</td>\n", + " <td>9</td>\n", + " <td>8</td>\n", + " <td>126</td>\n", + " </tr>\n", + " <tr>\n", + " <th>top</th>\n", + " <td>72</td>\n", + " <td>106</td>\n", + " <td>108</td>\n", + " <td>112</td>\n", + " <td>122</td>\n", + " <td>120</td>\n", + " <td>89</td>\n", + " <td>74</td>\n", + " <td>66</td>\n", + " <td>80</td>\n", + " <td>102</td>\n", + " <td>110</td>\n", + " <td>107</td>\n", + " </tr>\n", + " <tr>\n", + " <th>freq</th>\n", + " <td>91</td>\n", + " <td>494</td>\n", + " <td>641</td>\n", + " <td>457</td>\n", + " <td>2</td>\n", + " <td>296</td>\n", + " <td>2</td>\n", + " <td>2</td>\n", + " <td>2</td>\n", + " <td>2</td>\n", + " <td>4</td>\n", + " <td>1</td>\n", + " <td>41</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "component blood pressure systolic \\\n", + "units cc/min mmHg cc/min \n", + "description 3313 455 51 220179 442 220050 3315 \n", + "count 2241 26480 35622 21957 17 15186 22 \n", + "unique 81 181 208 176 14 172 21 \n", + "top 72 106 108 112 122 120 89 \n", + "freq 91 494 641 457 2 296 2 \n", + "\n", + "component \n", + "units mmHg \n", + "description 3317 3321 3323 224167 227243 225309 \n", + "count 16 13 14 12 8 1251 \n", + "unique 13 12 11 9 8 126 \n", + "top 74 66 80 102 110 107 \n", + "freq 2 2 2 4 1 41 " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "((103300, 1), (97535, 13), 461L, 2, '0.2094% records')\n", + "(2017-06-20 10:04:12)<<<< DONE (2.0s)\n", + "(2017-06-20 10:04:12)>>>> Cleaning... (97535, 13)\n", + "(2017-06-20 10:04:14)<<<< DONE (2.0s)\n", + "(2017-06-20 10:04:14)>>>> Nominal to OneHot\n", + "(2017-06-20 10:04:14)<<<< DONE (0.0s)\n", + "(2017-06-20 10:04:14)>>>> Drop OOB data | (97527, 13)\n", + "(2017-06-20 10:04:14)>>>>>> blood pressure systolic, mmHg, 100525\n", + "(2017-06-20 10:04:19)<<<<<< DONE (5.0s)\n", + "(2017-06-20 10:04:19)>>>>>> blood pressure systolic, cc/min, 2306\n", + "(2017-06-20 10:04:19)<<<<<< DONE (0.0s)\n" + ] + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th></th>\n", + " <th>component</th>\n", + " <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>status</th>\n", + " <th colspan=\"8\" halign=\"left\">known</th>\n", + " <th colspan=\"5\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>variable_type</th>\n", + " <th colspan=\"8\" halign=\"left\">qn</th>\n", + " <th colspan=\"5\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>units</th>\n", + " <th colspan=\"8\" halign=\"left\">mmHg</th>\n", + " <th colspan=\"5\" halign=\"left\">cc/min</th>\n", + " </tr>\n", + " <tr>\n", + " <th></th>\n", + " <th>description</th>\n", + " <th>220050</th>\n", + " <th>220179</th>\n", + " <th>224167</th>\n", + " <th>225309</th>\n", + " <th>227243</th>\n", + " <th>442</th>\n", + " <th>455</th>\n", + " <th>51</th>\n", + " <th>3313</th>\n", + " <th>3315</th>\n", + " <th>3317</th>\n", + " <th>3321</th>\n", + " <th>3323</th>\n", + " </tr>\n", + " <tr>\n", + " <th>id</th>\n", + " <th>datetime</th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " <th></th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th rowspan=\"2\" valign=\"top\">100304</th>\n", + " <th>2161-10-01 22:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>67.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2161-10-01 23:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>68.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th rowspan=\"3\" valign=\"top\">100788</th>\n", + " <th>2120-04-10 14:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>127.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2120-04-10 15:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>127.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2120-04-10 16:00:00</th>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>123.0</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " <td>NaN</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "component blood pressure systolic \\\n", + "status known \n", + "variable_type qn \n", + "units mmHg \n", + "description 220050 220179 224167 225309 \n", + "id datetime \n", + "100304 2161-10-01 22:00:00 NaN NaN NaN NaN \n", + " 2161-10-01 23:00:00 NaN NaN NaN NaN \n", + "100788 2120-04-10 14:00:00 NaN NaN NaN NaN \n", + " 2120-04-10 15:00:00 NaN NaN NaN NaN \n", + " 2120-04-10 16:00:00 NaN NaN NaN NaN \n", + "\n", + "component \n", + "status unknown \n", + "variable_type qn \n", + "units cc/min \n", + "description 227243 442 455 51 3313 3315 3317 3321 3323 \n", + "id datetime \n", + "100304 2161-10-01 22:00:00 NaN NaN NaN NaN 67.0 NaN NaN NaN NaN \n", + " 2161-10-01 23:00:00 NaN NaN NaN NaN 68.0 NaN NaN NaN NaN \n", + "100788 2120-04-10 14:00:00 NaN NaN 127.0 NaN NaN NaN NaN NaN NaN \n", + " 2120-04-10 15:00:00 NaN NaN 127.0 NaN NaN NaN NaN NaN NaN \n", + " 2120-04-10 16:00:00 NaN NaN 123.0 NaN NaN NaN NaN NaN NaN " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "<div>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr>\n", + " <th>component</th>\n", + " <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n", + " </tr>\n", + " <tr>\n", + " <th>status</th>\n", + " <th colspan=\"8\" halign=\"left\">known</th>\n", + " <th colspan=\"5\" halign=\"left\">unknown</th>\n", + " </tr>\n", + " <tr>\n", + " <th>variable_type</th>\n", + " <th colspan=\"8\" halign=\"left\">qn</th>\n", + " <th colspan=\"5\" halign=\"left\">qn</th>\n", + " </tr>\n", + " <tr>\n", + " <th>units</th>\n", + " <th colspan=\"8\" halign=\"left\">mmHg</th>\n", + " <th colspan=\"5\" halign=\"left\">cc/min</th>\n", + " </tr>\n", + " <tr>\n", + " <th>description</th>\n", + " <th>220050</th>\n", + " <th>220179</th>\n", + " <th>224167</th>\n", + " <th>225309</th>\n", + " <th>227243</th>\n", + " <th>442</th>\n", + " <th>455</th>\n", + " <th>51</th>\n", + " <th>3313</th>\n", + " <th>3315</th>\n", + " <th>3317</th>\n", + " <th>3321</th>\n", + " <th>3323</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>count</th>\n", + " <td>15186.000000</td>\n", + " <td>21957.000000</td>\n", + " <td>12.000000</td>\n", + " <td>1251.000000</td>\n", + " <td>8.00000</td>\n", + " <td>17.000000</td>\n", + " <td>26478.000000</td>\n", + " <td>35616.000000</td>\n", + " <td>2241.000000</td>\n", + " <td>22.000000</td>\n", + " <td>16.00000</td>\n", + " <td>13.000000</td>\n", + " <td>14.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>mean</th>\n", + " <td>118.988213</td>\n", + " <td>119.200483</td>\n", + " <td>104.416667</td>\n", + " <td>110.457234</td>\n", + " <td>111.87500</td>\n", + " <td>122.882353</td>\n", + " <td>119.150623</td>\n", + " <td>121.264628</td>\n", + " <td>70.371709</td>\n", + " <td>77.727273</td>\n", + " <td>76.68750</td>\n", + " <td>77.846154</td>\n", + " <td>75.714286</td>\n", + " </tr>\n", + " <tr>\n", + " <th>std</th>\n", + " <td>23.366007</td>\n", + " <td>21.757748</td>\n", + " <td>15.559027</td>\n", + " <td>20.465707</td>\n", + " <td>19.05209</td>\n", + " <td>31.262762</td>\n", + " <td>23.206573</td>\n", + " <td>25.927916</td>\n", + " <td>12.969975</td>\n", + " <td>15.495566</td>\n", + " <td>17.72651</td>\n", + " <td>14.932326</td>\n", + " <td>14.514865</td>\n", + " </tr>\n", + " <tr>\n", + " <th>min</th>\n", + " <td>0.000000</td>\n", + " <td>33.000000</td>\n", + " <td>86.000000</td>\n", + " <td>23.000000</td>\n", + " <td>84.00000</td>\n", + " <td>70.000000</td>\n", + " <td>0.000000</td>\n", + " <td>0.000000</td>\n", + " <td>38.000000</td>\n", + " <td>54.000000</td>\n", + " <td>50.00000</td>\n", + " <td>58.000000</td>\n", + " <td>55.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>25%</th>\n", + " <td>103.000000</td>\n", + " <td>104.000000</td>\n", + " <td>97.500000</td>\n", + " <td>99.000000</td>\n", + " <td>97.25000</td>\n", + " <td>96.000000</td>\n", + " <td>102.000000</td>\n", + " <td>104.000000</td>\n", + " <td>61.000000</td>\n", + " <td>66.250000</td>\n", + " <td>62.75000</td>\n", + " <td>67.000000</td>\n", + " <td>66.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>50%</th>\n", + " <td>117.000000</td>\n", + " <td>117.000000</td>\n", + " <td>102.000000</td>\n", + " <td>108.000000</td>\n", + " <td>116.00000</td>\n", + " <td>125.000000</td>\n", + " <td>117.000000</td>\n", + " <td>119.000000</td>\n", + " <td>70.000000</td>\n", + " <td>76.000000</td>\n", + " <td>76.00000</td>\n", + " <td>75.000000</td>\n", + " <td>75.500000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75%</th>\n", + " <td>133.000000</td>\n", + " <td>133.000000</td>\n", + " <td>104.000000</td>\n", + " <td>120.000000</td>\n", + " <td>128.50000</td>\n", + " <td>138.000000</td>\n", + " <td>135.000000</td>\n", + " <td>137.000000</td>\n", + " <td>77.000000</td>\n", + " <td>86.750000</td>\n", + " <td>86.00000</td>\n", + " <td>84.000000</td>\n", + " <td>80.000000</td>\n", + " </tr>\n", + " <tr>\n", + " <th>max</th>\n", + " <td>244.000000</td>\n", + " <td>247.000000</td>\n", + " <td>144.000000</td>\n", + " <td>273.000000</td>\n", + " <td>132.00000</td>\n", + " <td>174.000000</td>\n", + " <td>234.000000</td>\n", + " <td>284.000000</td>\n", + " <td>123.000000</td>\n", + " <td>112.000000</td>\n", + " <td>120.00000</td>\n", + " <td>108.000000</td>\n", + " <td>99.000000</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + "component blood pressure systolic \\\n", + "status known \n", + "variable_type qn \n", + "units mmHg \n", + "description 220050 220179 224167 225309 \n", + "count 15186.000000 21957.000000 12.000000 1251.000000 \n", + "mean 118.988213 119.200483 104.416667 110.457234 \n", + "std 23.366007 21.757748 15.559027 20.465707 \n", + "min 0.000000 33.000000 86.000000 23.000000 \n", + "25% 103.000000 104.000000 97.500000 99.000000 \n", + "50% 117.000000 117.000000 102.000000 108.000000 \n", + "75% 133.000000 133.000000 104.000000 120.000000 \n", + "max 244.000000 247.000000 144.000000 273.000000 \n", + "\n", + "component \\\n", + "status unknown \n", + "variable_type qn \n", + "units cc/min \n", + "description 227243 442 455 51 3313 \n", + "count 8.00000 17.000000 26478.000000 35616.000000 2241.000000 \n", + "mean 111.87500 122.882353 119.150623 121.264628 70.371709 \n", + "std 19.05209 31.262762 23.206573 25.927916 12.969975 \n", + "min 84.00000 70.000000 0.000000 0.000000 38.000000 \n", + "25% 97.25000 96.000000 102.000000 104.000000 61.000000 \n", + "50% 116.00000 125.000000 117.000000 119.000000 70.000000 \n", + "75% 128.50000 138.000000 135.000000 137.000000 77.000000 \n", + "max 132.00000 174.000000 234.000000 284.000000 123.000000 \n", + "\n", + "component \n", + "status \n", + "variable_type \n", + "units \n", + "description 3315 3317 3321 3323 \n", + "count 22.000000 16.00000 13.000000 14.000000 \n", + "mean 77.727273 76.68750 77.846154 75.714286 \n", + "std 15.495566 17.72651 14.932326 14.514865 \n", + "min 54.000000 50.00000 58.000000 55.000000 \n", + "25% 66.250000 62.75000 67.000000 66.000000 \n", + "50% 76.000000 76.00000 75.000000 75.500000 \n", + "75% 86.750000 86.00000 84.000000 80.000000 \n", + "max 112.000000 120.00000 108.000000 99.000000 " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "((103300, 1), (97527, 13), 469L, 2, '0.2094% records')\n", + "(2017-06-20 10:04:19)<<<< DONE (5.0s)\n", + "(2017-06-20 10:04:19)<< DONE (62.0s)\n", + "(2017-06-20 10:04:19) DONE (70.0s)\n" + ] + } + ], + "source": [ + "n = 100\n", + "hdf5_fname = do_ETL(data_dict,[data_dict.components.BLOOD_PRESSURE_SYSTOLIC],tag,n)" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-06-20 10:09:14) BEGIN ETL for all admissions\n", + "(2017-06-20 10:09:15)>> Extract CONTEXT...\n", + "(2017-06-20 10:09:27)<< DONE (12.0s)\n", + "(2017-06-20 10:09:27)>> BLOOD PRESSURE SYSTOLIC\n", + "(2017-06-20 10:09:27)>>>> Extracting...\n", + "(2017-06-20 10:09:28)>>>>>> Extracting 14 items from chartevents\n", + "51 2099353\n", + "455 1586769\n", + "220179 1290488\n", + "220050 1149788\n", + "3313 148105\n", + "225309 86557\n", + "3315 3762\n", + "442 2565\n", + "3317 2052\n", + "3323 2039\n", + "3321 2032\n", + "224167 740\n", + "227243 541\n", + "6 33\n", + "Name: itemid, dtype: int64\n", + " id datetime value units itemid\n", + "963709 136796.0 2139-10-06 21:00:00 113/55 6\n", + "963711 136796.0 2139-10-06 22:00:00 126/58 6\n", + "963713 136796.0 2139-10-06 23:00:00 139/64 6\n", + "964245 136796.0 2139-10-07 07:00:00 132/59 6\n", + "964247 136796.0 2139-10-07 08:00:00 143/63 6\n", + "964301 136796.0 2139-10-07 16:00:00 152/68 6\n", + "964304 136796.0 2139-10-07 18:00:00 141/59 6\n", + "964710 136796.0 2139-10-07 09:00:00 133/59 6\n", + "964743 136796.0 2139-10-07 10:00:00 131/60 6\n", + "965088 136796.0 2139-10-07 11:00:00 123/54 6\n", + "965090 136796.0 2139-10-07 12:00:00 185/79 6\n", + "965092 136796.0 2139-10-07 13:00:00 116/54 6\n", + "965094 136796.0 2139-10-07 14:00:00 122/57 6\n", + "965096 136796.0 2139-10-07 15:00:00 120/56 6\n", + "965438 136796.0 2139-10-06 13:00:00 122/55 6\n", + "965440 136796.0 2139-10-06 14:00:00 110/56 6\n", + "965854 136796.0 2139-10-06 18:00:00 108/56 6\n", + "965856 136796.0 2139-10-06 20:00:00 115/56 6\n", + "966407 136796.0 2139-10-07 03:00:00 129/57 6\n", + "966409 136796.0 2139-10-07 04:00:00 121/55 6\n", + "966411 136796.0 2139-10-07 05:00:00 125/56 6\n", + "968122 136796.0 2139-10-06 09:00:00 119/55 6\n", + "968125 136796.0 2139-10-06 12:00:00 113/60 6\n", + "968615 136796.0 2139-10-07 00:00:00 120/54 6\n", + "968617 136796.0 2139-10-07 01:00:00 130/58 6\n", + "968619 136796.0 2139-10-07 02:00:00 124/56 6\n" + ] + }, + { + "ename": "KeyError", + "evalue": "0L", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mKeyError\u001b[0m Traceback (most recent call last)", + "\u001b[1;32m<ipython-input-44-88e79271be02>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m 1\u001b[0m \u001b[0mn\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mconstants\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mhdf5_fname\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdo_ETL\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_SYSTOLIC\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'bp'\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m", + "\u001b[1;32m<ipython-input-37-093e315c4cfe>\u001b[0m in \u001b[0;36mdo_ETL\u001b[1;34m(data_dict, components, tag, n, seed)\u001b[0m\n\u001b[0;32m 2\u001b[0m \u001b[0mhdf5_fname\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'data/mimic_{}_{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mtag\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3\u001b[0m \u001b[0mhadm_ids\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mn\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mn\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mconstants\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mALL\u001b[0m \u001b[1;32melse\u001b[0m \u001b[0mmimic\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msample_hadm_ids\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mseed\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 4\u001b[1;33m \u001b[0mmimic_ETL\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 5\u001b[0m \u001b[1;32mreturn\u001b[0m \u001b[0mhdf5_fname\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32m<ipython-input-36-1619d6fa19c9>\u001b[0m in \u001b[0;36mmimic_ETL\u001b[1;34m(components, data_dict, hdf5_fname, hadm_ids, agg_func)\u001b[0m\n\u001b[0;32m 35\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 36\u001b[0m \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mlog\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m\"Extracting...\"\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mnew_level\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 37\u001b[1;33m \u001b[0mdf_extracted\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mextractor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 38\u001b[0m \u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msave_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_extracted\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'extracted/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 39\u001b[0m \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mend_log_level\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.py\u001b[0m in \u001b[0;36mextract_component\u001b[1;34m(self, component, hadm_ids)\u001b[0m\n\u001b[0;32m 95\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 96\u001b[0m \u001b[1;32mdef\u001b[0m \u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 97\u001b[1;33m \u001b[1;32mreturn\u001b[0m \u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mconn\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mitem_map\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 98\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 99\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.py\u001b[0m in \u001b[0;36mextract_component\u001b[1;34m(mimic_conn, component, item_map, data_dict, hadm_ids)\u001b[0m\n\u001b[0;32m 132\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mbp_slice\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m!=\u001b[0m \u001b[1;36m0\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 133\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mcomponent\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_SYSTOLIC\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 134\u001b[1;33m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mis_item_6\u001b[0m \u001b[1;33m&\u001b[0m \u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mis_item_6\u001b[0m \u001b[1;33m&\u001b[0m \u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstr\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'/'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mastype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mint\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 135\u001b[0m \u001b[1;32melif\u001b[0m \u001b[0mcomponent\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_DIASTOLIC\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 136\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstr\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'/'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mastype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mint\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\series.pyc\u001b[0m in \u001b[0;36m__getitem__\u001b[1;34m(self, key)\u001b[0m\n\u001b[0;32m 599\u001b[0m \u001b[0mkey\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mcom\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_apply_if_callable\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 600\u001b[0m \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 601\u001b[1;33m \u001b[0mresult\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_value\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 602\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 603\u001b[0m \u001b[1;32mif\u001b[0m \u001b[1;32mnot\u001b[0m \u001b[0mis_scalar\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresult\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\indexes\\base.pyc\u001b[0m in \u001b[0;36mget_value\u001b[1;34m(self, series, key)\u001b[0m\n\u001b[0;32m 2137\u001b[0m \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 2138\u001b[0m return self._engine.get_value(s, k,\n\u001b[1;32m-> 2139\u001b[1;33m tz=getattr(series.dtype, 'tz', None))\n\u001b[0m\u001b[0;32m 2140\u001b[0m \u001b[1;32mexcept\u001b[0m \u001b[0mKeyError\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0me1\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 2141\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mlen\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;33m>\u001b[0m \u001b[1;36m0\u001b[0m \u001b[1;32mand\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0minferred_type\u001b[0m \u001b[1;32min\u001b[0m \u001b[1;33m[\u001b[0m\u001b[1;34m'integer'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;34m'boolean'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n", + "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_value (pandas\\index.c:3338)\u001b[1;34m()\u001b[0m\n", + "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_value (pandas\\index.c:3041)\u001b[1;34m()\u001b[0m\n", + "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_loc (pandas\\index.c:4024)\u001b[1;34m()\u001b[0m\n", + "\u001b[1;32mpandas\\src\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas.hashtable.Int64HashTable.get_item (pandas\\hashtable.c:8141)\u001b[1;34m()\u001b[0m\n", + "\u001b[1;32mpandas\\src\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas.hashtable.Int64HashTable.get_item (pandas\\hashtable.c:8085)\u001b[1;34m()\u001b[0m\n", + "\u001b[1;31mKeyError\u001b[0m: 0L" + ] + } + ], + "source": [ + "n = constants.ALL\n", + "hdf5_fname = do_ETL(data_dict,[data_dict.components.BLOOD_PRESSURE_SYSTOLIC],'bp',n)" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": { + "collapsed": false, + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "<class 'pandas.io.pytables.HDFStore'>\n", + "File path: data/mimic_simple_all\n", + "/cleaned/blood pressure diastolic frame \n", + "/cleaned/blood pressure mean frame \n", + "/cleaned/blood pressure systolic frame \n", + "/cleaned/glasgow coma scale eye opening frame \n", + "/cleaned/glasgow coma scale motor frame \n", + "/cleaned/glasgow coma scale verbal frame \n", + "/cleaned/heart rate frame \n", + "/cleaned/hemoglobin frame \n", + "/cleaned/lactate frame \n", + "/cleaned/lactated ringers frame \n", + "/cleaned/norepinephrine frame \n", + "/cleaned/normal saline frame \n", + "/cleaned/output urine frame \n", + "/cleaned/oxygen saturation pulse oximetry frame \n", + "/cleaned/respiratory rate frame \n", + "/cleaned/temperature body frame \n", + "/cleaned/vasopressin frame \n", + "/cleaned/weight body frame \n", + "/context frame (shape->[62722,22]) \n", + "/extracted/blood pressure diastolic frame (shape->[6371249,5])\n", + "/extracted/blood pressure mean frame (shape->[2536271,5])\n", + "/extracted/blood pressure systolic frame (shape->[6374824,5])\n", + "/extracted/glasgow coma scale eye opening frame (shape->[956672,5]) \n", + "/extracted/glasgow coma scale motor frame (shape->[952565,5]) \n", + "/extracted/glasgow coma scale verbal frame (shape->[954700,5]) \n", + "/extracted/heart rate frame (shape->[7952939,5])\n", + "/extracted/hemoglobin frame (shape->[1167921,5])\n", + "/extracted/lactate frame (shape->[393608,5]) \n", + "/extracted/lactated ringers frame (shape->[504306,5]) \n", + "/extracted/norepinephrine frame (shape->[1136938,5])\n", + "/extracted/normal saline frame (shape->[817373,5]) \n", + "/extracted/output urine frame (shape->[3644639,5])\n", + "/extracted/oxygen saturation pulse oximetry frame (shape->[6099827,5])\n", + "/extracted/respiratory rate frame (shape->[7810019,5])\n", + "/extracted/temperature body frame (shape->[1751447,5])\n", + "/extracted/vasopressin frame (shape->[339184,5]) \n", + "/extracted/weight body frame (shape->[95425,5]) \n", + "/transformed/blood pressure diastolic frame \n", + "/transformed/blood pressure mean frame \n", + "/transformed/blood pressure systolic frame \n", + "/transformed/glasgow coma scale eye opening frame \n", + "/transformed/glasgow coma scale motor frame \n", + "/transformed/glasgow coma scale verbal frame \n", + "/transformed/heart rate frame \n", + "/transformed/hemoglobin frame \n", + "/transformed/lactate frame \n", + "/transformed/lactated ringers frame \n", + "/transformed/norepinephrine frame \n", + "/transformed/normal saline frame \n", + "/transformed/output urine frame \n", + "/transformed/oxygen saturation pulse oximetry frame \n", + "/transformed/respiratory rate frame \n", + "/transformed/temperature body frame \n", + "/transformed/vasopressin frame \n", + "/transformed/weight body frame " + ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "store = pd.HDFStore(hdf5_fname)\n", + "store" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "store.close()" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import utils\n", + "import mimic\n", + "import icu_data_defs\n", + "import transformers" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n", + "components = data_dict.get_panel_defintions(1).component.unique().tolist() #1 is vitals" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "data": { + "text/plain": [ + "[u'heart rate',\n", + " u'blood pressure systolic',\n", + " u'blood pressure diastolic',\n", + " u'blood pressure mean',\n", + " u'respiratory rate',\n", + " u'temperature body',\n", + " u'oxygen saturation pulse oximetry',\n", + " u'weight body']" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "components" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": { + "collapsed": false + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(2017-07-04 22:28:15)<<<<<<<< --- (25.0s)\n", + "(2017-07-04 22:28:15)>>>>>>>> ***ETL***\n", + "(2017-07-04 22:28:15)>>>>>>>>>> SETUP\n", + "(2017-07-04 22:28:15)<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:28:15)>>>>>>>>>> BEGIN ETL for all admissions and 8 components: [u'heart rate', u'blood pressure systolic', u'blood pressure diastolic', u'blood pressure mean', u'respiratory rate', u'temperature body', u'oxygen saturation pulse oximetry', u'weight body']\n", + "(2017-07-04 22:28:15)>>>>>>>>>>>> HEART RATE: 1/8\n", + "(2017-07-04 22:28:15)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 22:28:16)>>>>>>>>>>>>>>>> Extracting 5 items from chartevents\n", + "(2017-07-04 22:29:12)<<<<<<<<<<<<<<<< --- (56.0s)\n", + "(2017-07-04 22:29:12)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 22:29:13)<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:29:13)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 22:29:33)<<<<<<<<<<<<<<<< --- (20.0s)\n", + "(2017-07-04 22:29:33)<<<<<<<<<<<<<< --- (78.0s)\n", + "(2017-07-04 22:29:33)>>>>>>>>>>>>>> Transforming... (7952939, 5)\n", + "Data Loss (Extract > Transformed): ((7952939, 1), (7923711, 6), 29066L, 171, '0.3015% records')\n", + "(2017-07-04 22:31:25)<<<<<<<<<<<<<< --- (112.0s)\n", + "(2017-07-04 22:31:25)>>>>>>>>>>>>>> Cleaning... (7923711, 6)\n", + "(2017-07-04 22:32:14)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 22:32:14)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:32:14)>>>>>>>>>>>>>>>> Drop OOB data | (7922986, 6)\n", + "(2017-07-04 22:32:18)>>>>>>>>>>>>>>>>>> heart rate, beats/min, 7923117\n", + "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<<<< --- (71.0s)\n", + "(2017-07-04 22:33:29)>>>>>>>>>>>>>>>>>> heart rate, no_units, 31\n", + "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<< --- (75.0s)\n", + "Data Loss (Extract > Cleaned): ((7952939, 1), (7922986, 6), 29804L, 171, '0.3015% records')\n", + "(2017-07-04 22:33:31)<<<<<<<<<<<<<< --- (126.0s)\n", + "(2017-07-04 22:33:31)>>>>>>>>>>>>>> Filter & sort - (7922986, 6)\n", + "(2017-07-04 22:33:35)<<<<<<<<<<<<<< --- (4.0s)\n", + "(2017-07-04 22:33:35)>>>>>>>>>>>>>> Convert to dask - (7922986, 6)\n", + "(2017-07-04 22:33:36)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:33:36)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 22:33:36)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:33:36)<<<<<<<<<<<< --- (321.0s)\n", + "(2017-07-04 22:33:36)>>>>>>>>>>>> BLOOD PRESSURE SYSTOLIC: 2/8\n", + "(2017-07-04 22:33:36)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 22:33:36)>>>>>>>>>>>>>>>> Extracting 14 items from chartevents\n", + "(2017-07-04 22:35:06)<<<<<<<<<<<<<<<< --- (90.0s)\n", + "(2017-07-04 22:35:06)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 22:35:06)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:35:06)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 22:35:10)<<<<<<<<<<<<<<<< --- (4.0s)\n", + "(2017-07-04 22:35:10)<<<<<<<<<<<<<< --- (94.0s)\n", + "(2017-07-04 22:35:10)>>>>>>>>>>>>>> Transforming... (6374824, 5)\n", + "Data Loss (Extract > Transformed): ((6374824, 1), (5974719, 15), 43236L, 174, '0.307% records')\n", + "(2017-07-04 22:36:52)<<<<<<<<<<<<<< --- (102.0s)\n", + "(2017-07-04 22:36:52)>>>>>>>>>>>>>> Cleaning... (5974719, 15)\n", + "(2017-07-04 22:42:30)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 22:42:31)<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:42:31)>>>>>>>>>>>>>>>> Drop OOB data | (5974186, 14)\n", + "(2017-07-04 22:42:34)>>>>>>>>>>>>>>>>>> blood pressure systolic, mmHg, 6177439\n", + "(2017-07-04 22:45:18)<<<<<<<<<<<<<<<<<< --- (164.0s)\n", + "(2017-07-04 22:45:18)>>>>>>>>>>>>>>>>>> blood pressure systolic, cc/min, 153573\n", + "(2017-07-04 22:45:19)<<<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:45:19)<<<<<<<<<<<<<<<< --- (168.0s)\n", + "Data Loss (Extract > Cleaned): ((6374824, 1), (5974186, 14), 43848L, 174, '0.307% records')\n", + "(2017-07-04 22:45:20)<<<<<<<<<<<<<< --- (508.0s)\n", + "(2017-07-04 22:45:20)>>>>>>>>>>>>>> Filter & sort - (5974186, 14)\n", + "(2017-07-04 22:45:23)<<<<<<<<<<<<<< --- (3.0s)\n", + "(2017-07-04 22:45:23)>>>>>>>>>>>>>> Convert to dask - (5974186, 14)\n", + "(2017-07-04 22:45:25)<<<<<<<<<<<<<< --- (2.0s)\n", + "(2017-07-04 22:45:25)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 22:45:25)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:45:25)<<<<<<<<<<<< --- (709.0s)\n", + "(2017-07-04 22:45:25)>>>>>>>>>>>> BLOOD PRESSURE DIASTOLIC: 3/8\n", + "(2017-07-04 22:45:25)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 22:45:25)>>>>>>>>>>>>>>>> Extracting 16 items from chartevents\n", + "(2017-07-04 22:48:00)<<<<<<<<<<<<<<<< --- (155.0s)\n", + "(2017-07-04 22:48:00)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 22:48:00)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:48:00)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 22:48:06)<<<<<<<<<<<<<<<< --- (6.0s)\n", + "(2017-07-04 22:48:06)<<<<<<<<<<<<<< --- (161.0s)\n", + "(2017-07-04 22:48:06)>>>>>>>>>>>>>> Transforming... (6371282, 5)\n", + "Data Loss (Extract > Transformed): ((6371282, 1), (5976845, 17), 24410L, 170, '0.2999% records')\n", + "(2017-07-04 22:49:52)<<<<<<<<<<<<<< --- (106.0s)\n", + "(2017-07-04 22:49:52)>>>>>>>>>>>>>> Cleaning... (5976845, 17)\n", + "(2017-07-04 22:56:05)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 22:56:06)<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:56:06)>>>>>>>>>>>>>>>> Drop OOB data | (5976313, 16)\n", + "(2017-07-04 22:56:10)>>>>>>>>>>>>>>>>>> blood pressure diastolic, mmHg, 6194656\n", + "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<<<< --- (209.0s)\n", + "(2017-07-04 22:59:39)>>>>>>>>>>>>>>>>>> blood pressure diastolic, cc/min, 151640\n", + "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<< --- (213.0s)\n", + "Data Loss (Extract > Cleaned): ((6371282, 1), (5976313, 16), 25238L, 170, '0.2999% records')\n", + "(2017-07-04 22:59:41)<<<<<<<<<<<<<< --- (589.0s)\n", + "(2017-07-04 22:59:41)>>>>>>>>>>>>>> Filter & sort - (5976313, 16)\n", + "(2017-07-04 22:59:45)<<<<<<<<<<<<<< --- (4.0s)\n", + "(2017-07-04 22:59:45)>>>>>>>>>>>>>> Convert to dask - (5976313, 16)\n", + "(2017-07-04 22:59:46)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 22:59:46)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 22:59:46)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 22:59:46)<<<<<<<<<<<< --- (861.0s)\n", + "(2017-07-04 22:59:46)>>>>>>>>>>>> BLOOD PRESSURE MEAN: 4/8\n", + "(2017-07-04 22:59:46)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 22:59:46)>>>>>>>>>>>>>>>> Extracting 3 items from chartevents\n", + "(2017-07-04 23:00:18)<<<<<<<<<<<<<<<< --- (32.0s)\n", + "(2017-07-04 23:00:18)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 23:00:19)<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:00:19)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 23:00:20)<<<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:00:20)<<<<<<<<<<<<<< --- (34.0s)\n", + "(2017-07-04 23:00:20)>>>>>>>>>>>>>> Transforming... (2536271, 5)\n", + "Data Loss (Extract > Transformed): ((2536271, 1), (2416029, 3), 0L, 0, '0.0% records')\n", + "(2017-07-04 23:01:04)<<<<<<<<<<<<<< --- (44.0s)\n", + "(2017-07-04 23:01:04)>>>>>>>>>>>>>> Cleaning... (2416029, 3)\n", + "(2017-07-04 23:01:19)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 23:01:19)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:01:19)>>>>>>>>>>>>>>>> Drop OOB data | (2415995, 3)\n", + "(2017-07-04 23:01:20)>>>>>>>>>>>>>>>>>> blood pressure mean, mmHg, 2536236\n", + "(2017-07-04 23:01:55)<<<<<<<<<<<<<<<<<< --- (35.0s)\n", + "(2017-07-04 23:01:55)<<<<<<<<<<<<<<<< --- (36.0s)\n", + "Data Loss (Extract > Cleaned): ((2536271, 1), (2415995, 3), 1873L, 0, '0.0% records')\n", + "(2017-07-04 23:01:55)<<<<<<<<<<<<<< --- (51.0s)\n", + "(2017-07-04 23:01:55)>>>>>>>>>>>>>> Filter & sort - (2415995, 3)\n", + "(2017-07-04 23:01:56)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:01:56)>>>>>>>>>>>>>> Convert to dask - (2415995, 3)\n", + "(2017-07-04 23:01:57)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:01:57)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 23:01:57)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:01:57)<<<<<<<<<<<< --- (131.0s)\n", + "(2017-07-04 23:01:57)>>>>>>>>>>>> RESPIRATORY RATE: 5/8\n", + "(2017-07-04 23:01:57)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 23:01:57)>>>>>>>>>>>>>>>> Extracting 4 items from chartevents\n", + "(2017-07-04 23:06:09)<<<<<<<<<<<<<<<< --- (252.0s)\n", + "(2017-07-04 23:06:09)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 23:06:09)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:06:09)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 23:06:24)<<<<<<<<<<<<<<<< --- (15.0s)\n", + "(2017-07-04 23:06:24)<<<<<<<<<<<<<< --- (267.0s)\n", + "(2017-07-04 23:06:24)>>>>>>>>>>>>>> Transforming... (7810019, 5)\n", + "Data Loss (Extract > Transformed): ((7810019, 1), (7780717, 5), 28707L, 172, '0.3035% records')\n", + "(2017-07-04 23:08:13)<<<<<<<<<<<<<< --- (109.0s)\n", + "(2017-07-04 23:08:13)>>>>>>>>>>>>>> Cleaning... (7780717, 5)\n", + "(2017-07-04 23:11:07)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 23:11:07)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:11:07)>>>>>>>>>>>>>>>> Drop OOB data | (7780015, 4)\n", + "(2017-07-04 23:11:11)>>>>>>>>>>>>>>>>>> respiratory rate, insp/min, 6108262\n", + "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (57.0s)\n", + "(2017-07-04 23:12:08)>>>>>>>>>>>>>>>>>> respiratory rate, Breath, 1671901\n", + "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:12:08)>>>>>>>>>>>>>>>>>> respiratory rate, no_units, 2\n", + "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<< --- (61.0s)\n", + "Data Loss (Extract > Cleaned): ((7810019, 1), (7780015, 4), 29907L, 172, '0.3035% records')\n", + "(2017-07-04 23:12:09)<<<<<<<<<<<<<< --- (236.0s)\n", + "(2017-07-04 23:12:10)>>>>>>>>>>>>>> Filter & sort - (7780015, 4)\n", + "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (4.0s)\n", + "(2017-07-04 23:12:14)>>>>>>>>>>>>>> Convert to dask - (7780015, 4)\n", + "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:12:14)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:12:14)<<<<<<<<<<<< --- (617.0s)\n", + "(2017-07-04 23:12:14)>>>>>>>>>>>> TEMPERATURE BODY: 6/8\n", + "(2017-07-04 23:12:15)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 23:12:15)>>>>>>>>>>>>>>>> Extracting 4 items from chartevents\n", + "(2017-07-04 23:13:06)<<<<<<<<<<<<<<<< --- (51.0s)\n", + "(2017-07-04 23:13:06)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 23:13:06)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:13:06)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 23:13:11)<<<<<<<<<<<<<<<< --- (5.0s)\n", + "(2017-07-04 23:13:11)<<<<<<<<<<<<<< --- (56.0s)\n", + "(2017-07-04 23:13:11)>>>>>>>>>>>>>> Transforming... (1751447, 5)\n", + "Data Loss (Extract > Transformed): ((1751447, 1), (1731875, 4), 16612L, 156, '0.3189% records')\n", + "(2017-07-04 23:13:42)<<<<<<<<<<<<<< --- (31.0s)\n", + "(2017-07-04 23:13:42)>>>>>>>>>>>>>> Cleaning... (1731875, 4)\n", + "(2017-07-04 23:13:54)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 23:13:54)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:13:54)>>>>>>>>>>>>>>>> Drop OOB data | (1731794, 4)\n", + "(2017-07-04 23:13:55)>>>>>>>>>>>>>>>>>> temperature body, degF, 1734754\n", + "(2017-07-04 23:14:24)<<<<<<<<<<<<<<<<<< --- (29.0s)\n", + "(2017-07-04 23:14:24)<<<<<<<<<<<<<<<< --- (30.0s)\n", + "Data Loss (Extract > Cleaned): ((1751447, 1), (1731794, 4), 17226L, 156, '0.3189% records')\n", + "(2017-07-04 23:14:24)<<<<<<<<<<<<<< --- (42.0s)\n", + "(2017-07-04 23:14:24)>>>>>>>>>>>>>> Filter & sort - (1731794, 4)\n", + "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Convert to dask - (1731794, 4)\n", + "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:14:25)<<<<<<<<<<<< --- (131.0s)\n", + "(2017-07-04 23:14:25)>>>>>>>>>>>> OXYGEN SATURATION PULSE OXIMETRY: 7/8\n", + "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 23:14:25)>>>>>>>>>>>>>>>> Extracting 2 items from chartevents\n", + "(2017-07-04 23:15:41)<<<<<<<<<<<<<<<< --- (76.0s)\n", + "(2017-07-04 23:15:41)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 23:15:41)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:15:41)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 23:15:58)<<<<<<<<<<<<<<<< --- (17.0s)\n", + "(2017-07-04 23:15:58)<<<<<<<<<<<<<< --- (93.0s)\n", + "(2017-07-04 23:15:58)>>>>>>>>>>>>>> Transforming... (6099827, 5)\n", + "Data Loss (Extract > Transformed): ((6099827, 1), (6073540, 2), 26134L, 163, '0.3326% records')\n", + "(2017-07-04 23:17:28)<<<<<<<<<<<<<< --- (90.0s)\n", + "(2017-07-04 23:17:28)>>>>>>>>>>>>>> Cleaning... (6073540, 2)\n", + "(2017-07-04 23:18:01)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 23:18:01)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:18:01)>>>>>>>>>>>>>>>> Drop OOB data | (6073019, 2)\n", + "(2017-07-04 23:18:03)>>>>>>>>>>>>>>>>>> oxygen saturation pulse oximetry, percent, 6073172\n", + "(2017-07-04 23:18:54)<<<<<<<<<<<<<<<<<< --- (51.0s)\n", + "(2017-07-04 23:18:54)<<<<<<<<<<<<<<<< --- (53.0s)\n", + "Data Loss (Extract > Cleaned): ((6099827, 1), (6073019, 2), 26707L, 163, '0.3326% records')\n", + "(2017-07-04 23:18:55)<<<<<<<<<<<<<< --- (87.0s)\n", + "(2017-07-04 23:18:56)>>>>>>>>>>>>>> Filter & sort - (6073019, 2)\n", + "(2017-07-04 23:18:58)<<<<<<<<<<<<<< --- (2.0s)\n", + "(2017-07-04 23:18:58)>>>>>>>>>>>>>> Convert to dask - (6073019, 2)\n", + "(2017-07-04 23:18:59)<<<<<<<<<<<<<< --- (1.0s)\n", + "(2017-07-04 23:18:59)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 23:18:59)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:18:59)<<<<<<<<<<<< --- (274.0s)\n", + "(2017-07-04 23:18:59)>>>>>>>>>>>> WEIGHT BODY: 8/8\n", + "(2017-07-04 23:18:59)>>>>>>>>>>>>>> Extracting...\n", + "(2017-07-04 23:18:59)>>>>>>>>>>>>>>>> Extracting 3 items from chartevents\n", + "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (35.0s)\n", + "(2017-07-04 23:19:34)>>>>>>>>>>>>>>>> Combine DF\n", + "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:34)>>>>>>>>>>>>>>>> Clean UOM\n", + "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:34)<<<<<<<<<<<<<< --- (35.0s)\n", + "(2017-07-04 23:19:34)>>>>>>>>>>>>>> Transforming... (95425, 5)\n", + "Data Loss (Extract > Transformed): ((95425, 1), (94484, 3), 941L, 158, '0.4958% records')\n", + "(2017-07-04 23:19:36)<<<<<<<<<<<<<< --- (2.0s)\n", + "(2017-07-04 23:19:36)>>>>>>>>>>>>>> Cleaning... (94484, 3)\n", + "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>> Nominal to OneHot\n", + "(2017-07-04 23:19:37)<<<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>> Drop OOB data | (94457, 3)\n", + "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>>>> weight body, kg, 94457\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<<<<<< --- (5.0s)\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<<<< --- (5.0s)\n", + "Data Loss (Extract > Cleaned): ((95425, 1), (94457, 3), 979L, 158, '0.4958% records')\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (6.0s)\n", + "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Filter & sort - (94457, 3)\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Convert to dask - (94457, 3)\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Join to big DF\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n", + "(2017-07-04 23:19:42)<<<<<<<<<<<< --- (43.0s)\n", + "(2017-07-04 23:19:42)<<<<<<<<<< --- (3087.0s)\n", + "(2017-07-04 23:19:42)<<<<<<<< --- (3087.0s)\n" + ] + } + ], + "source": [ + "df_all = mimic.ETL(mimic.mimic_extractor('config/mimic_item_map.csv',data_dict),\n", + " components,\n", + " data_dict,\n", + " transformers.same_index_aggregator(agg_func=lambda x:x.iloc[0]))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Get all of the data we want and join into a single DF" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import utils\n", + "import logger\n", + "import transformers\n", + "import warnings\n", + "warnings.filterwarnings('ignore')\n", + "\n", + "def get_big_df(hdf5_fname,components):\n", + " \n", + " df_all = None\n", + " logger.log('Make DF for {} components...\\n{}'.format(len(components),'\\n'.join(components)),new_level=True)\n", + " for component in components:\n", + " logger.log('{}: {}/{}'.format(component.upper(),components.index(component)+1,len(components)),new_level=True)\n", + "\n", + " logger.log('Opening...')\n", + " df = utils.open_df(hdf5_fname,'cleaned/{}'.format(component)).sort_index(axis=1).sort_index()\n", + " display(df.describe(include='all'))\n", + "\n", + " df_cleaned = transformers.remove_small_columns(threshold=5).fit_transform(df)\n", + " \n", + " display(df_cleaned.describe(include='all'))\n", + "\n", + " print utils.data_loss(df,df_cleaned)\n", + " \n", + " logger.log('Join {} to {}'.format(df_cleaned.shape, None if df_all is None else df_all.shape))\n", + " if df_all is None: df_all = df_cleaned\n", + " else : \n", + " df_all = df_all.join(df_cleaned,how='outer')\n", + " del df,df_cleaned\n", + " \n", + " logger.end_log_level()\n", + " logger.end_log()\n", + "\n", + " return df_all" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "import icu_data_defs\n", + "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "components = data_dict.get_panel_defintions(12).component.unique().tolist()\n", + "components" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "#everything up to urine output\n", + "df1 = get_big_df('data/mimic_data',components[:8])\n", + "utils.save_df(df1,'data/mimic_data','cleaned/part1')\n", + "\n", + "#urine output and forward\n", + "df2 = get_big_df('data/mimic_data',components[8:])\n", + "utils.save_df(df2,'data/mimic_data','cleaned/part2')\n", + "\n", + "df_combined = df1.join(df2,how='outer')\n", + "\n", + "del df1,df2\n", + "df_all.shape" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "utils.save_df(df_combined,'data/mimic_data','cleaned/all')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Start here" + ] + }, + { + "cell_type": "code", + "execution_count": 70, + "metadata": { + "collapsed": false + }, + "outputs": [], + "source": [ + "\n", + "\n", + "def summable_filter(df):\n", + " ureg = units.MedicalUreg()\n", + " filter_func= lambda x: (ureg.is_volume(str(x[-2])) or ureg.is_mass(str(x[-2]))) and (x[0] != data_dict.labels.WEIGHT_BODY)\n", + " return df.loc[:,df.columns.map(filter_func)]\n", + "\n", + "def lactate_filter_admissions(hdf5_fname)\n", + "\n", + "def make_lactate_labels(hdf5_fname,custom_cleaners,data_dict):\n", + " df = utils.open_df(hdf5_fname,'cleaned/{}'.format(data_dict.labels.LACTATE))\n", + " df_cleaned = custom_cleaners.transform(df)\n", + " max_col_cleaner = transformers.max_col_only()\n", + " df_cleaned = max_col_cleaner.transform(df_cleaned)\n", + " df_cleaned.groupby(level=constants.column_names.ID).agg(lambda x: x.iloc[])\n", + " \n", + " \n", + "\n", + "basic_feature_tuples = [\n", + " ('MEAN',features.segment_mean(),constants.ALL),\n", + " ('STD',features.segment_std(),constants.ALL),\n", + " ('COUNT',features.segment_count(),constants.ALL),\n", + " ('LAST',features.segment_last(),constants.ALL),\n", + " ('SUM',features.segment_sum(),{constants.CUSTOM_FILTER:summable_filter})\n", + "]\n", + "\n", + "custom_cleaners = Pipeline([\n", + " ('drop_oob_values',transformers.oob_value_remover(data_dict)),\n", + " ('drop_small_columns',transformers.remove_small_columns(threshold=50)),\n", + " ('combine_like_columns',transformers.combine_like_cols()),\n", + "# ('quantitative_only',transformers.filter_var_type(var_types_to_keep)),\n", + "# ('known_col_only',transformers.known_col_only()),\n", + " ])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [ + "\n", + "\n", + "lactate_labels = make_lactate_labels(hdf5_fname,custom_cleaners)\n", + "\n", + "df_features = mimic_features(hdf5_fname,'basic_all_before',labels,custom_cleaners)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "collapsed": true + }, + "outputs": [], + "source": [] + } + ], + "metadata": { + "anaconda-cloud": {}, + "kernelspec": { + "display_name": "Python [Root]", + "language": "python", + "name": "Python [Root]" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 2 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython2", + "version": "2.7.12" + } + }, + "nbformat": 4, + "nbformat_minor": 0 +}