--- a
+++ b/1_simple_data.ipynb
@@ -0,0 +1,33087 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "%matplotlib inline\n",
+    "from IPython.display import display, HTML"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Build Data Definitions"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import icu_data_defs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>units</th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>clinical_source</th>\n",
+       "      <th>list_id</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>def_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>heart rate</td>\n",
+       "      <td>beats/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>blood pressure systolic</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>blood pressure diastolic</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>blood pressure mean</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>respiratory rate</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                           label      units variable_type clinical_source  \\\n",
+       "def_id                                                                      \n",
+       "0                     heart rate  beats/min            qn     observation   \n",
+       "1        blood pressure systolic       mmHg            qn     observation   \n",
+       "2       blood pressure diastolic       mmHg            qn     observation   \n",
+       "3            blood pressure mean       mmHg            qn     observation   \n",
+       "4               respiratory rate   insp/min            qn     observation   \n",
+       "\n",
+       "        list_id  \n",
+       "def_id           \n",
+       "0           NaN  \n",
+       "1           NaN  \n",
+       "2           NaN  \n",
+       "3           NaN  \n",
+       "4           NaN  "
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data_dict.tables.definitions.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 29,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Register the coagulation lab definitions; the returned ids are used to build the panel below.\n",
+    "inr_id = data_dict.add_definition(label='INR')\n",
+    "pt_id = data_dict.add_definition(\n",
+    "    label='Prothrombin Time',\n",
+    "    units='seconds',\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 30,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>units</th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>clinical_source</th>\n",
+       "      <th>list_id</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>def_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>23</th>\n",
+       "      <td>lactate</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>24</th>\n",
+       "      <td>lactate</td>\n",
+       "      <td>mg/dL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25</th>\n",
+       "      <td>hemoglobin</td>\n",
+       "      <td>g/dL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>26</th>\n",
+       "      <td>INR</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>27</th>\n",
+       "      <td>Prothrombin Time</td>\n",
+       "      <td>seconds</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   label    units variable_type clinical_source  list_id\n",
+       "def_id                                                                  \n",
+       "23               lactate   mmol/L            qn     observation      NaN\n",
+       "24               lactate    mg/dL            qn     observation      NaN\n",
+       "25            hemoglobin     g/dL            qn     observation      NaN\n",
+       "26                   INR      NaN            qn     observation      NaN\n",
+       "27      Prothrombin Time  seconds            qn     observation      NaN"
+      ]
+     },
+     "execution_count": 30,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data_dict.tables.definitions.tail()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 31,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>units</th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>clinical_source</th>\n",
+       "      <th>list_id</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>def_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>26</th>\n",
+       "      <td>INR</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>27</th>\n",
+       "      <td>Prothrombin Time</td>\n",
+       "      <td>seconds</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   label    units variable_type clinical_source  list_id\n",
+       "def_id                                                                  \n",
+       "26                   INR      NaN            qn     observation      NaN\n",
+       "27      Prothrombin Time  seconds            qn     observation      NaN"
+      ]
+     },
+     "execution_count": 31,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from itertools import product\n",
+    "\n",
+    "# Each panel member is a (table name, id) pair; both new definitions live in the definitions table.\n",
+    "definitions_table = data_dict.table_names.definitions\n",
+    "coag_def_ids = [inr_id, pt_id]\n",
+    "panel_map = list(product([definitions_table], coag_def_ids))\n",
+    "\n",
+    "panel_id = data_dict.add_panel('coagulation labs', panel_map)\n",
+    "data_dict.get_panel_defintions(panel_id)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 32,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>panel_name</th>\n",
+       "      <th>list_id</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>panel_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>blood pressure</td>\n",
+       "      <td>3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>vital signs</td>\n",
+       "      <td>4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>urine output</td>\n",
+       "      <td>5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>glasgow coma scale</td>\n",
+       "      <td>6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>normal saline</td>\n",
+       "      <td>7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td>8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>common fluids</td>\n",
+       "      <td>9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>norepinephrine</td>\n",
+       "      <td>10</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>vasopressin</td>\n",
+       "      <td>11</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>common pressors</td>\n",
+       "      <td>12</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>lactate</td>\n",
+       "      <td>13</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>oxygen delivery labs</td>\n",
+       "      <td>14</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>simple dataset</td>\n",
+       "      <td>15</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>coagulation labs</td>\n",
+       "      <td>16</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                    panel_name  list_id\n",
+       "panel_id                               \n",
+       "0               blood pressure        3\n",
+       "1                  vital signs        4\n",
+       "2                 urine output        5\n",
+       "3           glasgow coma scale        6\n",
+       "4                normal saline        7\n",
+       "5             lactated ringers        8\n",
+       "6                common fluids        9\n",
+       "7               norepinephrine       10\n",
+       "8                  vasopressin       11\n",
+       "9              common pressors       12\n",
+       "10                     lactate       13\n",
+       "11        oxygen delivery labs       14\n",
+       "12              simple dataset       15\n",
+       "13            coagulation labs       16"
+      ]
+     },
+     "execution_count": 32,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data_dict.tables.panels"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 33,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>units</th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>clinical_source</th>\n",
+       "      <th>list_id</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>def_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>heart rate</td>\n",
+       "      <td>beats/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>blood pressure systolic</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>blood pressure diastolic</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>blood pressure mean</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>respiratory rate</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>temperature body</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>oxygen saturation pulse oximetry</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>weight body</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>output urine</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>output urine</td>\n",
+       "      <td>mL/hr</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>output urine</td>\n",
+       "      <td>mL/kg/hr</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>glasgow coma scale motor</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>ord</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>glasgow coma scale eye opening</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>ord</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>glasgow coma scale verbal</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>ord</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>normal saline</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>15</th>\n",
+       "      <td>normal saline</td>\n",
+       "      <td>mL/hr</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>16</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>17</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td>mL/hr</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>18</th>\n",
+       "      <td>norepinephrine</td>\n",
+       "      <td>mcg</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>19</th>\n",
+       "      <td>norepinephrine</td>\n",
+       "      <td>mcg/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>20</th>\n",
+       "      <td>norepinephrine</td>\n",
+       "      <td>mcg/kg/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>21</th>\n",
+       "      <td>vasopressin</td>\n",
+       "      <td>units</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>22</th>\n",
+       "      <td>vasopressin</td>\n",
+       "      <td>units/min</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>intervention</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25</th>\n",
+       "      <td>hemoglobin</td>\n",
+       "      <td>g/dL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>23</th>\n",
+       "      <td>lactate</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>24</th>\n",
+       "      <td>lactate</td>\n",
+       "      <td>mg/dL</td>\n",
+       "      <td>qn</td>\n",
+       "      <td>observation</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                   label       units variable_type  \\\n",
+       "def_id                                                               \n",
+       "0                             heart rate   beats/min            qn   \n",
+       "1                blood pressure systolic        mmHg            qn   \n",
+       "2               blood pressure diastolic        mmHg            qn   \n",
+       "3                    blood pressure mean        mmHg            qn   \n",
+       "4                       respiratory rate    insp/min            qn   \n",
+       "5                       temperature body        degF            qn   \n",
+       "6       oxygen saturation pulse oximetry     percent            qn   \n",
+       "7                            weight body          kg            qn   \n",
+       "8                           output urine          mL            qn   \n",
+       "9                           output urine       mL/hr            qn   \n",
+       "10                          output urine    mL/kg/hr            qn   \n",
+       "11              glasgow coma scale motor         NaN           ord   \n",
+       "12        glasgow coma scale eye opening         NaN           ord   \n",
+       "13             glasgow coma scale verbal         NaN           ord   \n",
+       "14                         normal saline          mL            qn   \n",
+       "15                         normal saline       mL/hr            qn   \n",
+       "16                      lactated ringers          mL            qn   \n",
+       "17                      lactated ringers       mL/hr            qn   \n",
+       "18                        norepinephrine         mcg            qn   \n",
+       "19                        norepinephrine     mcg/min            qn   \n",
+       "20                        norepinephrine  mcg/kg/min            qn   \n",
+       "21                           vasopressin       units            qn   \n",
+       "22                           vasopressin   units/min            qn   \n",
+       "25                            hemoglobin        g/dL            qn   \n",
+       "23                               lactate      mmol/L            qn   \n",
+       "24                               lactate       mg/dL            qn   \n",
+       "\n",
+       "       clinical_source  list_id  \n",
+       "def_id                           \n",
+       "0          observation      NaN  \n",
+       "1          observation      NaN  \n",
+       "2          observation      NaN  \n",
+       "3          observation      NaN  \n",
+       "4          observation      NaN  \n",
+       "5          observation      NaN  \n",
+       "6          observation      NaN  \n",
+       "7          observation      NaN  \n",
+       "8          observation      NaN  \n",
+       "9          observation      NaN  \n",
+       "10         observation      NaN  \n",
+       "11         observation      0.0  \n",
+       "12         observation      2.0  \n",
+       "13         observation      1.0  \n",
+       "14        intervention      NaN  \n",
+       "15        intervention      NaN  \n",
+       "16        intervention      NaN  \n",
+       "17        intervention      NaN  \n",
+       "18        intervention      NaN  \n",
+       "19        intervention      NaN  \n",
+       "20        intervention      NaN  \n",
+       "21        intervention      NaN  \n",
+       "22        intervention      NaN  \n",
+       "25         observation      NaN  \n",
+       "23         observation      NaN  \n",
+       "24         observation      NaN  "
+      ]
+     },
+     "execution_count": 33,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look the panel up by name rather than hard-coding its row id (12 at the time of writing),\n",
+    "# so the cell keeps working if panels are added or reordered in the spreadsheet.\n",
+    "panels = data_dict.tables.panels\n",
+    "simple_panel_id = int(panels.index[panels['panel_name'] == 'simple dataset'][0])\n",
+    "data_dict.get_panel_defintions(simple_panel_id)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 34,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "data_dict.save()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# MIMIC Exploration"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import mimic\n",
+    "from icu_data_defs import data_dictionary"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "try:\n",
+    "    reload  # builtin on Python 2\n",
+    "except NameError:\n",
+    "    from importlib import reload  # Python 3 moved it to importlib\n",
+    "\n",
+    "# Pick up local edits to the mimic module without restarting the kernel.\n",
+    "reload(mimic)\n",
+    "conn = mimic.connect()\n",
+    "data_dict = data_dictionary('config/data_definitions.xlsx')\n",
+    "explorer = mimic.explorer(conn)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "keep_dict = {}"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Vital Signs"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Heart Rate"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>227018</th>\n",
+       "      <td>HR_ApacheIV</td>\n",
+       "      <td>HR_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223765</th>\n",
+       "      <td>Orthostatic HR sitting</td>\n",
+       "      <td>Orthostatic HR sitting</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1332</th>\n",
+       "      <td>pulse</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227581</th>\n",
+       "      <td>BiPap bpm (S/T -Back up)</td>\n",
+       "      <td>BiPap bpm (S/T -Back up)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220047</th>\n",
+       "      <td>Heart Rate Alarm - Low</td>\n",
+       "      <td>HR Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224363</th>\n",
+       "      <td>VAD Beat Rate L</td>\n",
+       "      <td>VAD Beat Rate L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226764</th>\n",
+       "      <td>HrApacheIIValue</td>\n",
+       "      <td>HrApacheIIValue</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1341</th>\n",
+       "      <td>PULSE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220045</th>\n",
+       "      <td>Heart Rate</td>\n",
+       "      <td>HR</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223775</th>\n",
+       "      <td>VAD Beat Rate R</td>\n",
+       "      <td>VAD Beat Rate R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220046</th>\n",
+       "      <td>Heart rate Alarm - High</td>\n",
+       "      <td>HR Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224751</th>\n",
+       "      <td>Temporary Pacemaker Rate</td>\n",
+       "      <td>Temp Pacemaker Rate</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Cardiovascular (Pacer Data)</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223764</th>\n",
+       "      <td>Orthostatic HR lying</td>\n",
+       "      <td>Orthostatic HR lying</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1725</th>\n",
+       "      <td>Pulse</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224422</th>\n",
+       "      <td>Spont RR</td>\n",
+       "      <td>Spont RR</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224647</th>\n",
+       "      <td>Orthostatic HR standing</td>\n",
+       "      <td>Orthostatic HR standing</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>bpm</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>211</th>\n",
+       "      <td>Heart Rate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220181</th>\n",
+       "      <td>Non Invasive Blood Pressure mean</td>\n",
+       "      <td>NBPm</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220052</th>\n",
+       "      <td>Arterial Blood Pressure mean</td>\n",
+       "      <td>ABPm</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3494</th>\n",
+       "      <td>Lowest Heart Rate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>92.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                   label              abbreviation  \\\n",
+       "itemid                                                               \n",
+       "227018                       HR_ApacheIV               HR_ApacheIV   \n",
+       "223765            Orthostatic HR sitting    Orthostatic HR sitting   \n",
+       "1332                               pulse                             \n",
+       "227581          BiPap bpm (S/T -Back up)  BiPap bpm (S/T -Back up)   \n",
+       "220047            Heart Rate Alarm - Low            HR Alarm - Low   \n",
+       "224363                   VAD Beat Rate L           VAD Beat Rate L   \n",
+       "226764                   HrApacheIIValue           HrApacheIIValue   \n",
+       "1341                               PULSE                             \n",
+       "220045                        Heart Rate                        HR   \n",
+       "223775                   VAD Beat Rate R           VAD Beat Rate R   \n",
+       "220046           Heart rate Alarm - High           HR Alarm - High   \n",
+       "224751          Temporary Pacemaker Rate       Temp Pacemaker Rate   \n",
+       "223764              Orthostatic HR lying      Orthostatic HR lying   \n",
+       "1725                               Pulse                             \n",
+       "224422                          Spont RR                  Spont RR   \n",
+       "224647           Orthostatic HR standing   Orthostatic HR standing   \n",
+       "211                           Heart Rate                             \n",
+       "220181  Non Invasive Blood Pressure mean                      NBPm   \n",
+       "220052      Arterial Blood Pressure mean                      ABPm   \n",
+       "3494                   Lowest Heart Rate                             \n",
+       "\n",
+       "            linksto                     category unitname       score  \n",
+       "itemid                                                                 \n",
+       "227018  chartevents       Scores - APACHE IV (2)      bpm  110.000000  \n",
+       "223765  chartevents          Routine Vital Signs      bpm  110.000000  \n",
+       "1332    chartevents                                        110.000000  \n",
+       "227581  chartevents                  Respiratory      bpm  110.000000  \n",
+       "220047  chartevents                       Alarms      bpm  110.000000  \n",
+       "224363  chartevents                 Hemodynamics      bpm  110.000000  \n",
+       "226764  chartevents           Scores - APACHE II      bpm  110.000000  \n",
+       "1341    chartevents                                        110.000000  \n",
+       "220045  chartevents          Routine Vital Signs      bpm  110.000000  \n",
+       "223775  chartevents                 Hemodynamics      bpm  110.000000  \n",
+       "220046  chartevents                       Alarms      bpm  110.000000  \n",
+       "224751  chartevents  Cardiovascular (Pacer Data)      bpm  110.000000  \n",
+       "223764  chartevents          Routine Vital Signs      bpm  110.000000  \n",
+       "1725    chartevents                                        110.000000  \n",
+       "224422  chartevents                  Respiratory      bpm  110.000000  \n",
+       "224647  chartevents          Routine Vital Signs      bpm  110.000000  \n",
+       "211     chartevents                                        110.000000  \n",
+       "220181  chartevents          Routine Vital Signs     mmHg  100.666667  \n",
+       "220052  chartevents          Routine Vital Signs     mmHg  100.666667  \n",
+       "3494    chartevents                                         92.666667  "
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Search with heart-rate related terms and preview the first 20 rows of the result.\n",
+    "out_df = explorer.search(['heart rate', 'beats', 'bpm', 'pulse'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Itemids kept for heart rate; the trailing comments give each itemid's label\n",
+    "# as shown in the search output of the previous cell.\n",
+    "label = data_dict.labels.HEART_RATE\n",
+    "keep_dict[label] = [\n",
+    "    211,     # Heart Rate\n",
+    "    220045,  # Heart Rate (abbreviation HR)\n",
+    "    1341,    # PULSE\n",
+    "    1725,    # Pulse\n",
+    "    1332,    # pulse\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Respiratory Rate"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 66,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>3603</th>\n",
+       "      <td>Resp Rate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224688</th>\n",
+       "      <td>Respiratory Rate (Set)</td>\n",
+       "      <td>Respiratory Rate (Set)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226774</th>\n",
+       "      <td>RRApacheIIValue</td>\n",
+       "      <td>RRApacheIIValue</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>618</th>\n",
+       "      <td>Respiratory Rate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224690</th>\n",
+       "      <td>Respiratory Rate (Total)</td>\n",
+       "      <td>Respiratory Rate (Total)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223875</th>\n",
+       "      <td>Fspn High</td>\n",
+       "      <td>Fspn High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224689</th>\n",
+       "      <td>Respiratory Rate (spontaneous)</td>\n",
+       "      <td>Respiratory Rate (spontaneous)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220210</th>\n",
+       "      <td>Respiratory Rate</td>\n",
+       "      <td>RR</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224161</th>\n",
+       "      <td>Resp Alarm - High</td>\n",
+       "      <td>Resp Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227050</th>\n",
+       "      <td>RR_ApacheIV</td>\n",
+       "      <td>RR_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224162</th>\n",
+       "      <td>Resp Alarm - Low</td>\n",
+       "      <td>Resp Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>insp/min</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>619</th>\n",
+       "      <td>Respiratory Rate Set</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>102.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225949</th>\n",
+       "      <td>NIV Mask</td>\n",
+       "      <td>NIV Mask</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223840</th>\n",
+       "      <td>ETT Re-taped</td>\n",
+       "      <td>ETT Re-taped</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223838</th>\n",
+       "      <td>ETT Location</td>\n",
+       "      <td>ETT Location</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223837</th>\n",
+       "      <td>ETT Size (ID)</td>\n",
+       "      <td>ETT Size (ID)</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224373</th>\n",
+       "      <td>Sputum Amount</td>\n",
+       "      <td>Sputum Amount</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223836</th>\n",
+       "      <td>Airway Type</td>\n",
+       "      <td>Airway Type</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226815</th>\n",
+       "      <td>Airway problems</td>\n",
+       "      <td>Airway problems</td>\n",
+       "      <td></td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223835</th>\n",
+       "      <td>Inspired O2 Fraction</td>\n",
+       "      <td>FiO2</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>None</td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                 label                    abbreviation  \\\n",
+       "itemid                                                                   \n",
+       "3603                         Resp Rate                                   \n",
+       "224688          Respiratory Rate (Set)          Respiratory Rate (Set)   \n",
+       "226774                 RRApacheIIValue                 RRApacheIIValue   \n",
+       "618                   Respiratory Rate                                   \n",
+       "224690        Respiratory Rate (Total)        Respiratory Rate (Total)   \n",
+       "223875                       Fspn High                       Fspn High   \n",
+       "224689  Respiratory Rate (spontaneous)  Respiratory Rate (spontaneous)   \n",
+       "220210                Respiratory Rate                              RR   \n",
+       "224161               Resp Alarm - High               Resp Alarm - High   \n",
+       "227050                     RR_ApacheIV                     RR_ApacheIV   \n",
+       "224162                Resp Alarm - Low                Resp Alarm - Low   \n",
+       "619               Respiratory Rate Set                                   \n",
+       "225949                        NIV Mask                        NIV Mask   \n",
+       "223840                    ETT Re-taped                    ETT Re-taped   \n",
+       "223838                    ETT Location                    ETT Location   \n",
+       "223837                   ETT Size (ID)                   ETT Size (ID)   \n",
+       "224373                   Sputum Amount                   Sputum Amount   \n",
+       "223836                     Airway Type                     Airway Type   \n",
+       "226815                 Airway problems                 Airway problems   \n",
+       "223835            Inspired O2 Fraction                            FiO2   \n",
+       "\n",
+       "            linksto                category  unitname       score  \n",
+       "itemid                                                             \n",
+       "3603    chartevents                                    110.000000  \n",
+       "224688  chartevents             Respiratory  insp/min  110.000000  \n",
+       "226774  chartevents      Scores - APACHE II  insp/min  110.000000  \n",
+       "618     chartevents                                    110.000000  \n",
+       "224690  chartevents             Respiratory  insp/min  110.000000  \n",
+       "223875  chartevents             Respiratory  insp/min  110.000000  \n",
+       "224689  chartevents             Respiratory  insp/min  110.000000  \n",
+       "220210  chartevents             Respiratory  insp/min  110.000000  \n",
+       "224161  chartevents                  Alarms  insp/min  110.000000  \n",
+       "227050  chartevents  Scores - APACHE IV (2)  insp/min  110.000000  \n",
+       "224162  chartevents                  Alarms  insp/min  110.000000  \n",
+       "619     chartevents                                    102.666667  \n",
+       "225949                          Respiratory             97.333333  \n",
+       "223840                          Respiratory             97.333333  \n",
+       "223838                          Respiratory             97.333333  \n",
+       "223837                          Respiratory             97.333333  \n",
+       "224373                          Respiratory             97.333333  \n",
+       "223836                          Respiratory             97.333333  \n",
+       "226815                          Respiratory             97.333333  \n",
+       "223835  chartevents             Respiratory      None   97.333333  "
+      ]
+     },
+     "execution_count": 66,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Search with respiratory-rate related terms and preview the first 20 rows of the result.\n",
+    "out_df = explorer.search(['respiratory rate', 'resp rate', 'insp/min', 'breath/min'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 67,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Itemids kept for respiratory rate; the trailing comments give the label shown\n",
+    "# in the search output of the previous cell where the itemid appears there.\n",
+    "label = data_dict.labels.RESPIRATORY_RATE\n",
+    "keep_dict[label] = [\n",
+    "    220210,  # Respiratory Rate (abbreviation RR)\n",
+    "    3603,    # Resp Rate\n",
+    "    618,     # Respiratory Rate\n",
+    "    # NOTE(review): the three itemids below are not among the 20 rows displayed\n",
+    "    # by the search cell above -- confirm their labels before relying on them.\n",
+    "    8113,\n",
+    "    615,\n",
+    "    219,\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Blood Pressure"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 68,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>224315</th>\n",
+       "      <td>ABI Brachial BP L</td>\n",
+       "      <td>ABI Brachial BP L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227537</th>\n",
+       "      <td>ART Blood Pressure Alarm - High</td>\n",
+       "      <td>ART BP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220181</th>\n",
+       "      <td>Non Invasive Blood Pressure mean</td>\n",
+       "      <td>NBPm</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220180</th>\n",
+       "      <td>Non Invasive Blood Pressure diastolic</td>\n",
+       "      <td>NBPd</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220179</th>\n",
+       "      <td>Non Invasive Blood Pressure systolic</td>\n",
+       "      <td>NBPs</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220074</th>\n",
+       "      <td>Central Venous Pressure</td>\n",
+       "      <td>CVP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220073</th>\n",
+       "      <td>Central Venous Pressure  Alarm - Low</td>\n",
+       "      <td>CVP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220072</th>\n",
+       "      <td>Central Venous Pressure Alarm - High</td>\n",
+       "      <td>CVP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220069</th>\n",
+       "      <td>Left Artrial Pressure</td>\n",
+       "      <td>LAP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220066</th>\n",
+       "      <td>Pulmonary Artery Pressure Alarm - Low</td>\n",
+       "      <td>PAP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220063</th>\n",
+       "      <td>Pulmonary Artery Pressure Alarm - High</td>\n",
+       "      <td>PAP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220061</th>\n",
+       "      <td>Pulmonary Artery Pressure mean</td>\n",
+       "      <td>PAPm</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220060</th>\n",
+       "      <td>Pulmonary Artery Pressure diastolic</td>\n",
+       "      <td>PAPd</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220059</th>\n",
+       "      <td>Pulmonary Artery Pressure systolic</td>\n",
+       "      <td>PAPs</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220058</th>\n",
+       "      <td>Arterial Blood Pressure Alarm - High</td>\n",
+       "      <td>ABP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227538</th>\n",
+       "      <td>ART Blood Pressure Alarm - Low</td>\n",
+       "      <td>ART BP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226096</th>\n",
+       "      <td>Orthostatic BPd standing</td>\n",
+       "      <td>Orthostatic BPd standing</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224152</th>\n",
+       "      <td>Return Pressure</td>\n",
+       "      <td>Return Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Dialysis</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227066</th>\n",
+       "      <td>Cerebral Perfusion Pressure</td>\n",
+       "      <td>CPP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226062</th>\n",
+       "      <td>Venous CO2 Pressure</td>\n",
+       "      <td>PCO2 (Venous)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                         label              abbreviation  \\\n",
+       "itemid                                                                     \n",
+       "224315                       ABI Brachial BP L         ABI Brachial BP L   \n",
+       "227537         ART Blood Pressure Alarm - High       ART BP Alarm - High   \n",
+       "220181        Non Invasive Blood Pressure mean                      NBPm   \n",
+       "220180   Non Invasive Blood Pressure diastolic                      NBPd   \n",
+       "220179    Non Invasive Blood Pressure systolic                      NBPs   \n",
+       "220074                 Central Venous Pressure                       CVP   \n",
+       "220073    Central Venous Pressure  Alarm - Low           CVP Alarm - Low   \n",
+       "220072    Central Venous Pressure Alarm - High          CVP Alarm - High   \n",
+       "220069                   Left Artrial Pressure                       LAP   \n",
+       "220066   Pulmonary Artery Pressure Alarm - Low           PAP Alarm - Low   \n",
+       "220063  Pulmonary Artery Pressure Alarm - High          PAP Alarm - High   \n",
+       "220061          Pulmonary Artery Pressure mean                      PAPm   \n",
+       "220060     Pulmonary Artery Pressure diastolic                      PAPd   \n",
+       "220059      Pulmonary Artery Pressure systolic                      PAPs   \n",
+       "220058    Arterial Blood Pressure Alarm - High          ABP Alarm - High   \n",
+       "227538          ART Blood Pressure Alarm - Low        ART BP Alarm - Low   \n",
+       "226096                Orthostatic BPd standing  Orthostatic BPd standing   \n",
+       "224152                         Return Pressure           Return Pressure   \n",
+       "227066             Cerebral Perfusion Pressure                       CPP   \n",
+       "226062                     Venous CO2 Pressure             PCO2 (Venous)   \n",
+       "\n",
+       "            linksto             category unitname  score  \n",
+       "itemid                                                    \n",
+       "224315  chartevents                 IABP     mmHg  110.0  \n",
+       "227537  chartevents               Alarms     mmHg  110.0  \n",
+       "220181  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "220180  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "220179  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "220074  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "220073  chartevents               Alarms     mmHg  110.0  \n",
+       "220072  chartevents               Alarms     mmHg  110.0  \n",
+       "220069  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "220066  chartevents               Alarms     mmHg  110.0  \n",
+       "220063  chartevents               Alarms     mmHg  110.0  \n",
+       "220061  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "220060  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "220059  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "220058  chartevents               Alarms     mmHg  110.0  \n",
+       "227538  chartevents               Alarms     mmHg  110.0  \n",
+       "226096  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "224152  chartevents             Dialysis     mmHg  110.0  \n",
+       "227066  chartevents         Hemodynamics     mmHg  110.0  \n",
+       "226062  chartevents                 Labs     mmHg  110.0  "
+      ]
+     },
+     "execution_count": 68,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Search with blood-pressure related terms; this cell shows rows 0-19 of the result.\n",
+    "out_df = explorer.search(['blood pressure', 'systolic', 'diastolic', 'mmHg'])\n",
+    "out_df.iloc[:20]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 69,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>226063</th>\n",
+       "      <td>Venous O2 Pressure</td>\n",
+       "      <td>PO2 (Venous)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225312</th>\n",
+       "      <td>ART BP mean</td>\n",
+       "      <td>ART BP mean</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225310</th>\n",
+       "      <td>ART BP Diastolic</td>\n",
+       "      <td>ART BP Diastolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225309</th>\n",
+       "      <td>ART BP Systolic</td>\n",
+       "      <td>ART BP Systolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223751</th>\n",
+       "      <td>Non-Invasive Blood Pressure Alarm - High</td>\n",
+       "      <td>NBP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227516</th>\n",
+       "      <td>PO2 (Mixed Venous)</td>\n",
+       "      <td>PO2 (Mixed Venous)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224166</th>\n",
+       "      <td>Doppler BP</td>\n",
+       "      <td>Doppler BP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224167</th>\n",
+       "      <td>Manual Blood Pressure Systolic Left</td>\n",
+       "      <td>Manual BPs L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226737</th>\n",
+       "      <td>AaDO2ApacheIIValue</td>\n",
+       "      <td>AaDO2ApacheIIValue</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228148</th>\n",
+       "      <td>ABI Ankle BP R (Impella)</td>\n",
+       "      <td>ABI Ankle BP R (Impella)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220224</th>\n",
+       "      <td>Arterial O2 pressure</td>\n",
+       "      <td>PO2 (Arterial)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220235</th>\n",
+       "      <td>Arterial CO2 Pressure</td>\n",
+       "      <td>PCO2 (Arterial)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223752</th>\n",
+       "      <td>Non-Invasive Blood Pressure Alarm - Low</td>\n",
+       "      <td>NBP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223763</th>\n",
+       "      <td>Bladder Pressure</td>\n",
+       "      <td>Bladder Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224150</th>\n",
+       "      <td>Filter Pressure</td>\n",
+       "      <td>Filter Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Dialysis</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224149</th>\n",
+       "      <td>Access Pressure</td>\n",
+       "      <td>Access Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Dialysis</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227991</th>\n",
+       "      <td>Intra Cranial Pressure #2 Alarm - Low</td>\n",
+       "      <td>IC2 Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226094</th>\n",
+       "      <td>Orthostatic BPd sitting</td>\n",
+       "      <td>Orthostatic BPd sitting</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226092</th>\n",
+       "      <td>Orthostatic BPd lying</td>\n",
+       "      <td>Orthostatic BPd lying</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227990</th>\n",
+       "      <td>Intra Cranial Pressure #2 Alarm - High</td>\n",
+       "      <td>IC2 Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                           label              abbreviation  \\\n",
+       "itemid                                                                       \n",
+       "226063                        Venous O2 Pressure              PO2 (Venous)   \n",
+       "225312                               ART BP mean               ART BP mean   \n",
+       "225310                          ART BP Diastolic          ART BP Diastolic   \n",
+       "225309                           ART BP Systolic           ART BP Systolic   \n",
+       "223751  Non-Invasive Blood Pressure Alarm - High          NBP Alarm - High   \n",
+       "227516                        PO2 (Mixed Venous)        PO2 (Mixed Venous)   \n",
+       "224166                                Doppler BP                Doppler BP   \n",
+       "224167       Manual Blood Pressure Systolic Left              Manual BPs L   \n",
+       "226737                        AaDO2ApacheIIValue        AaDO2ApacheIIValue   \n",
+       "228148                  ABI Ankle BP R (Impella)  ABI Ankle BP R (Impella)   \n",
+       "220224                      Arterial O2 pressure            PO2 (Arterial)   \n",
+       "220235                     Arterial CO2 Pressure           PCO2 (Arterial)   \n",
+       "223752   Non-Invasive Blood Pressure Alarm - Low           NBP Alarm - Low   \n",
+       "223763                          Bladder Pressure          Bladder Pressure   \n",
+       "224150                           Filter Pressure           Filter Pressure   \n",
+       "224149                           Access Pressure           Access Pressure   \n",
+       "227991     Intra Cranial Pressure #2 Alarm - Low           IC2 Alarm - Low   \n",
+       "226094                   Orthostatic BPd sitting   Orthostatic BPd sitting   \n",
+       "226092                     Orthostatic BPd lying     Orthostatic BPd lying   \n",
+       "227990    Intra Cranial Pressure #2 Alarm - High          IC2 Alarm - High   \n",
+       "\n",
+       "            linksto             category unitname  score  \n",
+       "itemid                                                    \n",
+       "226063  chartevents                 Labs     mmHg  110.0  \n",
+       "225312  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "225310  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "225309  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "223751  chartevents               Alarms     mmHg  110.0  \n",
+       "227516  chartevents                 Labs     mmHg  110.0  \n",
+       "224166  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "224167  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "226737  chartevents   Scores - APACHE II     mmHg  110.0  \n",
+       "228148  chartevents              Impella     mmHg  110.0  \n",
+       "220224  chartevents                 Labs     mmHg  110.0  \n",
+       "220235  chartevents                 Labs     mmHg  110.0  \n",
+       "223752  chartevents               Alarms     mmHg  110.0  \n",
+       "223763  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "224150  chartevents             Dialysis     mmHg  110.0  \n",
+       "224149  chartevents             Dialysis     mmHg  110.0  \n",
+       "227991  chartevents               Alarms     mmHg  110.0  \n",
+       "226094  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "226092  chartevents  Routine Vital Signs     mmHg  110.0  \n",
+       "227990  chartevents               Alarms     mmHg  110.0  "
+      ]
+     },
+     "execution_count": 69,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] = [220179]\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] = [220180]\n",
+    "out_df.iloc[20:40]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 70,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>227989</th>\n",
+       "      <td>Intra Cranial Pressure #2</td>\n",
+       "      <td>IC2</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220056</th>\n",
+       "      <td>Arterial Blood Pressure Alarm - Low</td>\n",
+       "      <td>ABP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220052</th>\n",
+       "      <td>Arterial Blood Pressure mean</td>\n",
+       "      <td>ABPm</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220051</th>\n",
+       "      <td>Arterial Blood Pressure diastolic</td>\n",
+       "      <td>ABPd</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220050</th>\n",
+       "      <td>Arterial Blood Pressure systolic</td>\n",
+       "      <td>ABPs</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228145</th>\n",
+       "      <td>ABI Ankle BP L</td>\n",
+       "      <td>ABI Ankle BP L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228146</th>\n",
+       "      <td>ABI Brachial BP R</td>\n",
+       "      <td>ABI Brachial BP R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227039</th>\n",
+       "      <td>PO2_ApacheIV</td>\n",
+       "      <td>PO2_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220765</th>\n",
+       "      <td>Intra Cranial Pressure</td>\n",
+       "      <td>ICP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227023</th>\n",
+       "      <td>MAP_ApacheIV</td>\n",
+       "      <td>MAP_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224309</th>\n",
+       "      <td>Assisted Systole</td>\n",
+       "      <td>SYS - Assisted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224310</th>\n",
+       "      <td>Augmented Diastole</td>\n",
+       "      <td>AUG</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224311</th>\n",
+       "      <td>BAEDP</td>\n",
+       "      <td>DIA - Assisted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224314</th>\n",
+       "      <td>ABI Brachial BP R (Impella)</td>\n",
+       "      <td>ABI Brachial BP R (Impella)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224317</th>\n",
+       "      <td>ABI Ankle BP R</td>\n",
+       "      <td>ABI Ankle BP R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224318</th>\n",
+       "      <td>ABI Ankle BP L (Impella)</td>\n",
+       "      <td>ABI Ankle BP L (Impella)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224322</th>\n",
+       "      <td>IABP Mean</td>\n",
+       "      <td>MAP - Assisted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223771</th>\n",
+       "      <td>PCWP</td>\n",
+       "      <td>PCWP</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223768</th>\n",
+       "      <td>Intra Cranial Pressure Alarm - Low</td>\n",
+       "      <td>ICP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223767</th>\n",
+       "      <td>Intra Cranial Pressure Alarm - High</td>\n",
+       "      <td>ICP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                      label                 abbreviation  \\\n",
+       "itemid                                                                     \n",
+       "227989            Intra Cranial Pressure #2                          IC2   \n",
+       "220056  Arterial Blood Pressure Alarm - Low              ABP Alarm - Low   \n",
+       "220052         Arterial Blood Pressure mean                         ABPm   \n",
+       "220051    Arterial Blood Pressure diastolic                         ABPd   \n",
+       "220050     Arterial Blood Pressure systolic                         ABPs   \n",
+       "228145                       ABI Ankle BP L              ABI Ankle BP L    \n",
+       "228146                    ABI Brachial BP R           ABI Brachial BP R    \n",
+       "227039                         PO2_ApacheIV                 PO2_ApacheIV   \n",
+       "220765               Intra Cranial Pressure                          ICP   \n",
+       "227023                         MAP_ApacheIV                 MAP_ApacheIV   \n",
+       "224309                     Assisted Systole               SYS - Assisted   \n",
+       "224310                   Augmented Diastole                          AUG   \n",
+       "224311                                BAEDP               DIA - Assisted   \n",
+       "224314          ABI Brachial BP R (Impella)  ABI Brachial BP R (Impella)   \n",
+       "224317                       ABI Ankle BP R               ABI Ankle BP R   \n",
+       "224318             ABI Ankle BP L (Impella)     ABI Ankle BP L (Impella)   \n",
+       "224322                            IABP Mean               MAP - Assisted   \n",
+       "223771                                 PCWP                         PCWP   \n",
+       "223768   Intra Cranial Pressure Alarm - Low              ICP Alarm - Low   \n",
+       "223767  Intra Cranial Pressure Alarm - High             ICP Alarm - High   \n",
+       "\n",
+       "            linksto                category unitname  score  \n",
+       "itemid                                                       \n",
+       "227989  chartevents            Hemodynamics     mmHg  110.0  \n",
+       "220056  chartevents                  Alarms     mmHg  110.0  \n",
+       "220052  chartevents     Routine Vital Signs     mmHg  110.0  \n",
+       "220051  chartevents     Routine Vital Signs     mmHg  110.0  \n",
+       "220050  chartevents     Routine Vital Signs     mmHg  110.0  \n",
+       "228145  chartevents                    IABP     mmHg  110.0  \n",
+       "228146  chartevents                    IABP     mmHg  110.0  \n",
+       "227039  chartevents  Scores - APACHE IV (2)     mmHg  110.0  \n",
+       "220765  chartevents            Hemodynamics     mmHg  110.0  \n",
+       "227023  chartevents  Scores - APACHE IV (2)     mmHg  110.0  \n",
+       "224309  chartevents                    IABP     mmHg  110.0  \n",
+       "224310  chartevents                    IABP     mmHg  110.0  \n",
+       "224311  chartevents                    IABP     mmHg  110.0  \n",
+       "224314  chartevents                 Impella     mmHg  110.0  \n",
+       "224317  chartevents                    IABP     mmHg  110.0  \n",
+       "224318  chartevents                 Impella     mmHg  110.0  \n",
+       "224322  chartevents                    IABP     mmHg  110.0  \n",
+       "223771  chartevents            Hemodynamics     mmHg  110.0  \n",
+       "223768  chartevents                  Alarms     mmHg  110.0  \n",
+       "223767  chartevents                  Alarms     mmHg  110.0  "
+      ]
+     },
+     "execution_count": 70,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Blood-pressure item IDs chosen from the out_df slices shown in the neighbouring cells\n",
+    "# (rows 20-39 and rows 60-79):\n",
+    "#   225309 = ART BP Systolic,  224167 = Manual Blood Pressure Systolic Left\n",
+    "#   225310 = ART BP Diastolic, 224643 = Manual Blood Pressure Diastolic Left\n",
+    "# Append only IDs that are not already present, so re-running this cell on its own\n",
+    "# does not add duplicate entries to keep_dict.\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += list(\n",
+    "    itemid for itemid in [225309, 224167]\n",
+    "    if itemid not in keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC])\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += list(\n",
+    "    itemid for itemid in [225310, 224643]\n",
+    "    if itemid not in keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC])\n",
+    "# Show the next 20 candidate rows (positions 40-59) for review.\n",
+    "out_df.iloc[40:60]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 71,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>223766</th>\n",
+       "      <td>Orthostatic BPs standing</td>\n",
+       "      <td>Orthostatic BPs standing</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228149</th>\n",
+       "      <td>ABI Brachial BP L (Impella)</td>\n",
+       "      <td>ABI Brachial BP L (Impella)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224151</th>\n",
+       "      <td>Effluent Pressure</td>\n",
+       "      <td>Effluent Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Dialysis</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224643</th>\n",
+       "      <td>Manual Blood Pressure Diastolic Left</td>\n",
+       "      <td>Manual BPd L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224654</th>\n",
+       "      <td>PAEDP</td>\n",
+       "      <td>DIA - Unassisted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226855</th>\n",
+       "      <td>PCWP (mean) (PA Line)</td>\n",
+       "      <td>PCWP (mean) (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226857</th>\n",
+       "      <td>PA mean pressure (PA Line)</td>\n",
+       "      <td>PA mean pressure (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224646</th>\n",
+       "      <td>Orthostatic BPs sitting</td>\n",
+       "      <td>Orthostatic BPs sitting</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227716</th>\n",
+       "      <td>Cerebral Perfusion Pressure Alarm - High</td>\n",
+       "      <td>CPP Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227717</th>\n",
+       "      <td>Cerebral Perfusion Pressure Alarm - Low</td>\n",
+       "      <td>CPP Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224645</th>\n",
+       "      <td>Orthostatic BPs lying</td>\n",
+       "      <td>Orthostatic BPs lying</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227242</th>\n",
+       "      <td>Manual Blood Pressure Diastolic Right</td>\n",
+       "      <td>Manual BPd R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226766</th>\n",
+       "      <td>MapApacheIIValue</td>\n",
+       "      <td>MapApacheIIValue</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227243</th>\n",
+       "      <td>Manual Blood Pressure Systolic Right</td>\n",
+       "      <td>Manual BPs R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226853</th>\n",
+       "      <td>PA diastolic pressure(PA Line)</td>\n",
+       "      <td>PA diastolic pressure(PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226849</th>\n",
+       "      <td>RA (mean) pressure (PA Line)</td>\n",
+       "      <td>RA (mean) pressure (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226850</th>\n",
+       "      <td>RV systolic pressure(PA Line)</td>\n",
+       "      <td>RV systolic pressure(PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226851</th>\n",
+       "      <td>RV diastolic pressure(PA Line)</td>\n",
+       "      <td>RV diastolic pressure(PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224659</th>\n",
+       "      <td>Vacuum Assist</td>\n",
+       "      <td>Vacuum Assist</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226854</th>\n",
+       "      <td>PCWP (v wave) (PA Line)</td>\n",
+       "      <td>PCWP (v wave) (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                           label  \\\n",
+       "itemid                                             \n",
+       "223766                  Orthostatic BPs standing   \n",
+       "228149               ABI Brachial BP L (Impella)   \n",
+       "224151                         Effluent Pressure   \n",
+       "224643      Manual Blood Pressure Diastolic Left   \n",
+       "224654                                     PAEDP   \n",
+       "226855                     PCWP (mean) (PA Line)   \n",
+       "226857                PA mean pressure (PA Line)   \n",
+       "224646                   Orthostatic BPs sitting   \n",
+       "227716  Cerebral Perfusion Pressure Alarm - High   \n",
+       "227717   Cerebral Perfusion Pressure Alarm - Low   \n",
+       "224645                     Orthostatic BPs lying   \n",
+       "227242     Manual Blood Pressure Diastolic Right   \n",
+       "226766                          MapApacheIIValue   \n",
+       "227243      Manual Blood Pressure Systolic Right   \n",
+       "226853            PA diastolic pressure(PA Line)   \n",
+       "226849              RA (mean) pressure (PA Line)   \n",
+       "226850             RV systolic pressure(PA Line)   \n",
+       "226851            RV diastolic pressure(PA Line)   \n",
+       "224659                             Vacuum Assist   \n",
+       "226854                   PCWP (v wave) (PA Line)   \n",
+       "\n",
+       "                          abbreviation      linksto             category  \\\n",
+       "itemid                                                                     \n",
+       "223766        Orthostatic BPs standing  chartevents  Routine Vital Signs   \n",
+       "228149     ABI Brachial BP L (Impella)  chartevents              Impella   \n",
+       "224151               Effluent Pressure  chartevents             Dialysis   \n",
+       "224643                    Manual BPd L  chartevents  Routine Vital Signs   \n",
+       "224654                DIA - Unassisted  chartevents                 IABP   \n",
+       "226855           PCWP (mean) (PA Line)  chartevents    PA Line Insertion   \n",
+       "226857      PA mean pressure (PA Line)  chartevents    PA Line Insertion   \n",
+       "224646         Orthostatic BPs sitting  chartevents  Routine Vital Signs   \n",
+       "227716                CPP Alarm - High  chartevents               Alarms   \n",
+       "227717                 CPP Alarm - Low  chartevents               Alarms   \n",
+       "224645           Orthostatic BPs lying  chartevents  Routine Vital Signs   \n",
+       "227242                    Manual BPd R  chartevents  Routine Vital Signs   \n",
+       "226766                MapApacheIIValue  chartevents   Scores - APACHE II   \n",
+       "227243                    Manual BPs R  chartevents  Routine Vital Signs   \n",
+       "226853  PA diastolic pressure(PA Line)  chartevents    PA Line Insertion   \n",
+       "226849    RA (mean) pressure (PA Line)  chartevents    PA Line Insertion   \n",
+       "226850   RV systolic pressure(PA Line)  chartevents    PA Line Insertion   \n",
+       "226851  RV diastolic pressure(PA Line)  chartevents    PA Line Insertion   \n",
+       "224659                   Vacuum Assist  chartevents         Hemodynamics   \n",
+       "226854         PCWP (v wave) (PA Line)  chartevents    PA Line Insertion   \n",
+       "\n",
+       "       unitname  score  \n",
+       "itemid                  \n",
+       "223766     mmHg  110.0  \n",
+       "228149     mmHg  110.0  \n",
+       "224151     mmHg  110.0  \n",
+       "224643     mmHg  110.0  \n",
+       "224654     mmHg  110.0  \n",
+       "226855     mmHg  110.0  \n",
+       "226857     mmHg  110.0  \n",
+       "224646     mmHg  110.0  \n",
+       "227716     mmHg  110.0  \n",
+       "227717     mmHg  110.0  \n",
+       "224645     mmHg  110.0  \n",
+       "227242     mmHg  110.0  \n",
+       "226766     mmHg  110.0  \n",
+       "227243     mmHg  110.0  \n",
+       "226853     mmHg  110.0  \n",
+       "226849     mmHg  110.0  \n",
+       "226850     mmHg  110.0  \n",
+       "226851     mmHg  110.0  \n",
+       "224659     mmHg  110.0  \n",
+       "226854     mmHg  110.0  "
+      ]
+     },
+     "execution_count": 71,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Blood-pressure item IDs chosen from the out_df slice shown by the previous cell (rows 40-59):\n",
+    "#   220050 = Arterial Blood Pressure systolic\n",
+    "#   220051 = Arterial Blood Pressure diastolic\n",
+    "# Append only IDs that are not already present, so re-running this cell on its own\n",
+    "# does not add duplicate entries to keep_dict.\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += list(\n",
+    "    itemid for itemid in [220050]\n",
+    "    if itemid not in keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC])\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += list(\n",
+    "    itemid for itemid in [220051]\n",
+    "    if itemid not in keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC])\n",
+    "# Show the next 20 candidate rows (positions 60-79) for review.\n",
+    "out_df.iloc[60:80]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 72,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>228158</th>\n",
+       "      <td>Purge Pressure</td>\n",
+       "      <td>Purge Pressure</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226852</th>\n",
+       "      <td>PA systolic pressure(PA Line)</td>\n",
+       "      <td>PA systolic pressure(PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224652</th>\n",
+       "      <td>Unassisted Systole</td>\n",
+       "      <td>SYS - Unassisted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>IABP</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7643</th>\n",
+       "      <td>RVSYSTOLIC</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>102.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8441</th>\n",
+       "      <td>NBP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8364</th>\n",
+       "      <td>ABP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8448</th>\n",
+       "      <td>PAP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>455</th>\n",
+       "      <td>NBP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>ABP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>492</th>\n",
+       "      <td>PAP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8508</th>\n",
+       "      <td>BP UAC [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>89.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8505</th>\n",
+       "      <td>BP PAL [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>89.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3319</th>\n",
+       "      <td>BP PAL [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3325</th>\n",
+       "      <td>BP UAC [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8502</th>\n",
+       "      <td>BP Cuff [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>87.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3313</th>\n",
+       "      <td>BP Cuff [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>86.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>153</th>\n",
+       "      <td>Diastolic Unloading</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>86.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227539</th>\n",
+       "      <td>ART Blood Pressure Alarm Source</td>\n",
+       "      <td>ART BP Alarm Source</td>\n",
+       "      <td></td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8440</th>\n",
+       "      <td>Manual BP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>666</th>\n",
+       "      <td>Systolic Unloading</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                  label                   abbreviation  \\\n",
+       "itemid                                                                   \n",
+       "228158                   Purge Pressure                 Purge Pressure   \n",
+       "226852    PA systolic pressure(PA Line)  PA systolic pressure(PA Line)   \n",
+       "224652               Unassisted Systole               SYS - Unassisted   \n",
+       "7643                         RVSYSTOLIC                                  \n",
+       "8441                    NBP [Diastolic]                                  \n",
+       "8364                    ABP [Diastolic]                                  \n",
+       "8448                    PAP [Diastolic]                                  \n",
+       "455                      NBP [Systolic]                                  \n",
+       "6                        ABP [Systolic]                                  \n",
+       "492                      PAP [Systolic]                                  \n",
+       "8508                 BP UAC [Diastolic]                                  \n",
+       "8505                 BP PAL [Diastolic]                                  \n",
+       "3319                  BP PAL [Systolic]                                  \n",
+       "3325                  BP UAC [Systolic]                                  \n",
+       "8502                BP Cuff [Diastolic]                                  \n",
+       "3313                 BP Cuff [Systolic]                                  \n",
+       "153                 Diastolic Unloading                                  \n",
+       "227539  ART Blood Pressure Alarm Source            ART BP Alarm Source   \n",
+       "8440              Manual BP [Diastolic]                                  \n",
+       "666                  Systolic Unloading                                  \n",
+       "\n",
+       "            linksto           category unitname       score  \n",
+       "itemid                                                       \n",
+       "228158  chartevents            Impella     mmHg  110.000000  \n",
+       "226852  chartevents  PA Line Insertion     mmHg  110.000000  \n",
+       "224652  chartevents               IABP     mmHg  110.000000  \n",
+       "7643    chartevents                              102.666667  \n",
+       "8441    chartevents                               95.666667  \n",
+       "8364    chartevents                               95.666667  \n",
+       "8448    chartevents                               95.666667  \n",
+       "455     chartevents                               94.333333  \n",
+       "6       chartevents                               94.333333  \n",
+       "492     chartevents                               94.333333  \n",
+       "8508    chartevents                               89.666667  \n",
+       "8505    chartevents                               89.666667  \n",
+       "3319    chartevents                               88.000000  \n",
+       "3325    chartevents                               88.000000  \n",
+       "8502    chartevents                               87.666667  \n",
+       "3313    chartevents                               86.333333  \n",
+       "153     chartevents                               86.000000  \n",
+       "227539                          Alarms            84.666667  \n",
+       "8440    chartevents                               84.666667  \n",
+       "666     chartevents                               84.666667  "
+      ]
+     },
+     "execution_count": 72,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += list(_id for _id in [227243] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC])  # append only ids not already kept, so re-running this cell cannot duplicate them\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += list(_id for _id in [227242] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC])  # same guard for the diastolic list\n",
+    "out_df.iloc[80:100]  # display positional rows 80-99 of out_df"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 73,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>6417</th>\n",
+       "      <td>low pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7133</th>\n",
+       "      <td>abd pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6944</th>\n",
+       "      <td>LOW PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2027</th>\n",
+       "      <td>Low pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6107</th>\n",
+       "      <td>Low Pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>442</th>\n",
+       "      <td>Manual BP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>83.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8503</th>\n",
+       "      <td>BP Left Arm [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8504</th>\n",
+       "      <td>BP Left Leg [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8368</th>\n",
+       "      <td>Arterial BP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8506</th>\n",
+       "      <td>BP Right Arm [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8507</th>\n",
+       "      <td>BP Right Leg [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51</th>\n",
+       "      <td>Arterial BP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3315</th>\n",
+       "      <td>BP Left Arm [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3317</th>\n",
+       "      <td>BP Left Leg [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3321</th>\n",
+       "      <td>BP Right Arm [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3323</th>\n",
+       "      <td>BP Right Leg [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8555</th>\n",
+       "      <td>Arterial BP #2 [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>29</th>\n",
+       "      <td>Access mmHg</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44560</th>\n",
+       "      <td>blood</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>70015</th>\n",
+       "      <td>BLOOD</td>\n",
+       "      <td></td>\n",
+       "      <td>microbiologyevents</td>\n",
+       "      <td>SPECIMEN</td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                             label abbreviation             linksto  category  \\\n",
+       "itemid                                                                          \n",
+       "6417                  low pressure                      chartevents             \n",
+       "7133                  abd pressure                      chartevents             \n",
+       "6944                  LOW PRESSURE                      chartevents             \n",
+       "2027                  Low pressure                      chartevents             \n",
+       "6107                  Low Pressure                      chartevents             \n",
+       "442           Manual BP [Systolic]                      chartevents             \n",
+       "8503       BP Left Arm [Diastolic]                      chartevents             \n",
+       "8504       BP Left Leg [Diastolic]                      chartevents             \n",
+       "8368       Arterial BP [Diastolic]                      chartevents             \n",
+       "8506      BP Right Arm [Diastolic]                      chartevents             \n",
+       "8507      BP Right Leg [Diastolic]                      chartevents             \n",
+       "51          Arterial BP [Systolic]                      chartevents             \n",
+       "3315        BP Left Arm [Systolic]                      chartevents             \n",
+       "3317        BP Left Leg [Systolic]                      chartevents             \n",
+       "3321       BP Right Arm [Systolic]                      chartevents             \n",
+       "3323       BP Right Leg [Systolic]                      chartevents             \n",
+       "8555    Arterial BP #2 [Diastolic]                      chartevents             \n",
+       "29                     Access mmHg                      chartevents             \n",
+       "44560                        blood                   inputevents_cv             \n",
+       "70015                        BLOOD               microbiologyevents  SPECIMEN   \n",
+       "\n",
+       "       unitname      score  \n",
+       "itemid                      \n",
+       "6417             84.333333  \n",
+       "7133             84.333333  \n",
+       "6944             84.333333  \n",
+       "2027             84.333333  \n",
+       "6107             84.333333  \n",
+       "442              83.000000  \n",
+       "8503             82.000000  \n",
+       "8504             82.000000  \n",
+       "8368             82.000000  \n",
+       "8506             81.000000  \n",
+       "8507             81.000000  \n",
+       "51               80.000000  \n",
+       "3315             80.000000  \n",
+       "3317             80.000000  \n",
+       "3321             79.000000  \n",
+       "3323             79.000000  \n",
+       "8555             79.000000  \n",
+       "29               78.666667  \n",
+       "44560            78.666667  \n",
+       "70015            78.666667  "
+      ]
+     },
+     "execution_count": 73,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += list(_id for _id in [455, 6] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC])  # append only ids not already kept, so re-running this cell cannot duplicate them\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += list(_id for _id in [8441, 8364] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC])  # same guard for the diastolic list\n",
+    "out_df.iloc[100:120]  # display positional rows 100-119 of out_df"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 74,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>51466</th>\n",
+       "      <td>BLOOD</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6127</th>\n",
+       "      <td>LO Press</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46780</th>\n",
+       "      <td>Bladdar pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1404</th>\n",
+       "      <td>Bladder pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>993</th>\n",
+       "      <td>bladder pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6701</th>\n",
+       "      <td>Arterial BP #2 [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1411</th>\n",
+       "      <td>Bladder Pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>996</th>\n",
+       "      <td>BLADDER PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44862</th>\n",
+       "      <td>BLADDER PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>77.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>770</th>\n",
+       "      <td>AST</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Enzymes</td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220587</th>\n",
+       "      <td>AST</td>\n",
+       "      <td>AST</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>None</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2347</th>\n",
+       "      <td>BLADDER PRESSURE.</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6631</th>\n",
+       "      <td>pressure low</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>75.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3108</th>\n",
+       "      <td>PA PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>75.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7504</th>\n",
+       "      <td>Driv pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>75.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2779</th>\n",
+       "      <td>bladder pressures</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>75.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43763</th>\n",
+       "      <td>Bladder presure</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>74.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1509</th>\n",
+       "      <td>bld pres</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>73.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6540</th>\n",
+       "      <td>IntraABd pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>73.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8444</th>\n",
+       "      <td>Orthostat BP sitting [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>73.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                   label abbreviation         linksto  \\\n",
+       "itemid                                                                  \n",
+       "51466                              BLOOD          NaN       labevents   \n",
+       "6127                            LO Press                  chartevents   \n",
+       "46780                   Bladdar pressure               inputevents_cv   \n",
+       "1404                    Bladder pressure                  chartevents   \n",
+       "993                     bladder pressure                  chartevents   \n",
+       "6701           Arterial BP #2 [Systolic]                  chartevents   \n",
+       "1411                    Bladder Pressure                  chartevents   \n",
+       "996                     BLADDER PRESSURE                  chartevents   \n",
+       "44862                   BLADDER PRESSURE               inputevents_cv   \n",
+       "770                                  AST                  chartevents   \n",
+       "220587                               AST          AST     chartevents   \n",
+       "2347                   BLADDER PRESSURE.                  chartevents   \n",
+       "6631                        pressure low                  chartevents   \n",
+       "3108                         PA PRESSURE                  chartevents   \n",
+       "7504                       Driv pressure                  chartevents   \n",
+       "2779                   bladder pressures                  chartevents   \n",
+       "43763                    Bladder presure               inputevents_cv   \n",
+       "1509                            bld pres                  chartevents   \n",
+       "6540                   IntraABd pressure                  chartevents   \n",
+       "8444    Orthostat BP sitting [Diastolic]                  chartevents   \n",
+       "\n",
+       "                category unitname      score  \n",
+       "itemid                                        \n",
+       "51466         HEMATOLOGY      NaN  78.666667  \n",
+       "6127                               78.000000  \n",
+       "46780                              77.000000  \n",
+       "1404                               77.000000  \n",
+       "993                                77.000000  \n",
+       "6701                               77.000000  \n",
+       "1411                               77.000000  \n",
+       "996                                77.000000  \n",
+       "44862   Free Form Intake           77.000000  \n",
+       "770              Enzymes           76.666667  \n",
+       "220587              Labs     None  76.666667  \n",
+       "2347                               76.000000  \n",
+       "6631                               75.666667  \n",
+       "3108                               75.333333  \n",
+       "7504                               75.000000  \n",
+       "2779                               75.000000  \n",
+       "43763                              74.333333  \n",
+       "1509                               73.666667  \n",
+       "6540                               73.666667  \n",
+       "8444                               73.333333  "
+      ]
+     },
+     "execution_count": 74,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC] += list(_id for _id in [3313] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC])  # append only ids not already kept, so re-running this cell cannot duplicate them\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC] += list(_id for _id in [8502, 8440] if _id not in keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC])  # same guard for the diastolic list\n",
+    "out_df.iloc[120:140]  # display positional rows 120-139 of out_df"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 75,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>8446</th>\n",
+       "      <td>Orthostatic BP lying [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>73.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8445</th>\n",
+       "      <td>OrthostatBP standing [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>73.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6302</th>\n",
+       "      <td>low press</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>72.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2562</th>\n",
+       "      <td>INTRA ABD PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>72.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45682</th>\n",
+       "      <td>bladder pressure in</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>72.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7124</th>\n",
+       "      <td>Low pressure Alarm</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>72.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43744</th>\n",
+       "      <td>NS bladder pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>72.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228151</th>\n",
+       "      <td>Aortic Pressure Signal - Diastolic</td>\n",
+       "      <td>Aortic Pressure Signal - Diastolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>None</td>\n",
+       "      <td>72.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42735</th>\n",
+       "      <td>Intra-abd. Pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>71.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>484</th>\n",
+       "      <td>Orthostatic BP lying [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>482</th>\n",
+       "      <td>OrthostatBP standing [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>480</th>\n",
+       "      <td>Orthostat BP sitting [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44344</th>\n",
+       "      <td>BLADDER PRESSURE FLD</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>71.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44187</th>\n",
+       "      <td>Blood emesis</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>71.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3238</th>\n",
+       "      <td>CSF PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>71.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2965</th>\n",
+       "      <td>INTRAABDOM. PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>70.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228152</th>\n",
+       "      <td>Aortic Pressure Signal - Systolic</td>\n",
+       "      <td>Aortic Pressure Signal - Systolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>None</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50934</th>\n",
+       "      <td>H</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7574</th>\n",
+       "      <td>lumbar pressure</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>69.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2704</th>\n",
+       "      <td>ABDOMINAL PRESSURE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>69.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                     label  \\\n",
+       "itemid                                       \n",
+       "8446      Orthostatic BP lying [Diastolic]   \n",
+       "8445      OrthostatBP standing [Diastolic]   \n",
+       "6302                             low press   \n",
+       "2562                    INTRA ABD PRESSURE   \n",
+       "45682                  bladder pressure in   \n",
+       "7124                    Low pressure Alarm   \n",
+       "43744                  NS bladder pressure   \n",
+       "228151  Aortic Pressure Signal - Diastolic   \n",
+       "42735                  Intra-abd. Pressure   \n",
+       "484        Orthostatic BP lying [Systolic]   \n",
+       "482        OrthostatBP standing [Systolic]   \n",
+       "480        Orthostat BP sitting [Systolic]   \n",
+       "44344                 BLADDER PRESSURE FLD   \n",
+       "44187                         Blood emesis   \n",
+       "3238                          CSF PRESSURE   \n",
+       "2965                  INTRAABDOM. PRESSURE   \n",
+       "228152   Aortic Pressure Signal - Systolic   \n",
+       "50934                                    H   \n",
+       "7574                       lumbar pressure   \n",
+       "2704                    ABDOMINAL PRESSURE   \n",
+       "\n",
+       "                              abbreviation         linksto          category  \\\n",
+       "itemid                                                                         \n",
+       "8446                                           chartevents                     \n",
+       "8445                                           chartevents                     \n",
+       "6302                                           chartevents                     \n",
+       "2562                                           chartevents                     \n",
+       "45682                                       inputevents_cv  Free Form Intake   \n",
+       "7124                                           chartevents                     \n",
+       "43744                                       inputevents_cv  Free Form Intake   \n",
+       "228151  Aortic Pressure Signal - Diastolic     chartevents           Impella   \n",
+       "42735                                       inputevents_cv  Free Form Intake   \n",
+       "484                                            chartevents                     \n",
+       "482                                            chartevents                     \n",
+       "480                                            chartevents                     \n",
+       "44344                                       inputevents_cv  Free Form Intake   \n",
+       "44187                                         outputevents  Free Form Intake   \n",
+       "3238                                           chartevents                     \n",
+       "2965                                           chartevents                     \n",
+       "228152   Aortic Pressure Signal - Systolic     chartevents           Impella   \n",
+       "50934                                  NaN       labevents         CHEMISTRY   \n",
+       "7574                                           chartevents                     \n",
+       "2704                                           chartevents                     \n",
+       "\n",
+       "       unitname      score  \n",
+       "itemid                      \n",
+       "8446             73.333333  \n",
+       "8445             73.333333  \n",
+       "6302             72.666667  \n",
+       "2562             72.333333  \n",
+       "45682            72.333333  \n",
+       "7124             72.333333  \n",
+       "43744            72.333333  \n",
+       "228151     None  72.000000  \n",
+       "42735            71.666667  \n",
+       "484              71.333333  \n",
+       "482              71.333333  \n",
+       "480              71.333333  \n",
+       "44344            71.000000  \n",
+       "44187            71.000000  \n",
+       "3238             71.000000  \n",
+       "2965             70.333333  \n",
+       "228152     None  70.000000  \n",
+       "50934       NaN  70.000000  \n",
+       "7574             69.666667  \n",
+       "2704             69.666667  "
+      ]
+     },
+     "execution_count": 75,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC].extend([442, 3315, 51, 3317])  # Manual BP, BP Left Arm, Arterial BP, BP Left Leg [Systolic]\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC].extend([8368, 8503, 8504, 8507, 8506])  # Arterial BP, BP Left Arm, BP Left Leg, BP Right Leg, BP Right Arm [Diastolic]\n",
+    "out_df.iloc[140:160]  # candidate rows 140-159"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 76,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC].extend([3321, 3323])  # BP Right Arm, BP Right Leg [Systolic]\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC].append(8555)  # Arterial BP #2 [Diastolic]\n",
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_MEAN] = [220181, 225312, 220052]  # NOTE(review): labels for these itemids are not shown nearby - confirm"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC].append(6701)  # NOTE(review): 6701 is absent from the saved systolic listing (this cell was not executed) - confirm its label"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 77,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>220179</th>\n",
+       "      <td>Non Invasive Blood Pressure systolic</td>\n",
+       "      <td>NBPs</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225309</th>\n",
+       "      <td>ART BP Systolic</td>\n",
+       "      <td>ART BP Systolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224167</th>\n",
+       "      <td>Manual Blood Pressure Systolic Left</td>\n",
+       "      <td>Manual BPs L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220050</th>\n",
+       "      <td>Arterial Blood Pressure systolic</td>\n",
+       "      <td>ABPs</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227243</th>\n",
+       "      <td>Manual Blood Pressure Systolic Right</td>\n",
+       "      <td>Manual BPs R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>455</th>\n",
+       "      <td>NBP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>ABP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3313</th>\n",
+       "      <td>BP Cuff [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>86.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>442</th>\n",
+       "      <td>Manual BP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>83.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3315</th>\n",
+       "      <td>BP Left Arm [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51</th>\n",
+       "      <td>Arterial BP [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3317</th>\n",
+       "      <td>BP Left Leg [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3321</th>\n",
+       "      <td>BP Right Arm [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3323</th>\n",
+       "      <td>BP Right Leg [Systolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                       label     abbreviation      linksto  \\\n",
+       "itemid                                                                       \n",
+       "220179  Non Invasive Blood Pressure systolic             NBPs  chartevents   \n",
+       "225309                       ART BP Systolic  ART BP Systolic  chartevents   \n",
+       "224167   Manual Blood Pressure Systolic Left     Manual BPs L  chartevents   \n",
+       "220050      Arterial Blood Pressure systolic             ABPs  chartevents   \n",
+       "227243  Manual Blood Pressure Systolic Right     Manual BPs R  chartevents   \n",
+       "455                           NBP [Systolic]                   chartevents   \n",
+       "6                             ABP [Systolic]                   chartevents   \n",
+       "3313                      BP Cuff [Systolic]                   chartevents   \n",
+       "442                     Manual BP [Systolic]                   chartevents   \n",
+       "3315                  BP Left Arm [Systolic]                   chartevents   \n",
+       "51                    Arterial BP [Systolic]                   chartevents   \n",
+       "3317                  BP Left Leg [Systolic]                   chartevents   \n",
+       "3321                 BP Right Arm [Systolic]                   chartevents   \n",
+       "3323                 BP Right Leg [Systolic]                   chartevents   \n",
+       "\n",
+       "                   category unitname       score  \n",
+       "itemid                                            \n",
+       "220179  Routine Vital Signs     mmHg  110.000000  \n",
+       "225309  Routine Vital Signs     mmHg  110.000000  \n",
+       "224167  Routine Vital Signs     mmHg  110.000000  \n",
+       "220050  Routine Vital Signs     mmHg  110.000000  \n",
+       "227243  Routine Vital Signs     mmHg  110.000000  \n",
+       "455                                    94.333333  \n",
+       "6                                      94.333333  \n",
+       "3313                                   86.333333  \n",
+       "442                                    83.000000  \n",
+       "3315                                   80.000000  \n",
+       "51                                     80.000000  \n",
+       "3317                                   80.000000  \n",
+       "3321                                   79.000000  \n",
+       "3323                                   79.000000  "
+      ]
+     },
+     "execution_count": 77,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.loc[keep_dict[data_dict.labels.BLOOD_PRESSURE_SYSTOLIC], :]  # review every itemid kept for systolic BP"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 79,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>220180</th>\n",
+       "      <td>Non Invasive Blood Pressure diastolic</td>\n",
+       "      <td>NBPd</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225310</th>\n",
+       "      <td>ART BP Diastolic</td>\n",
+       "      <td>ART BP Diastolic</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224643</th>\n",
+       "      <td>Manual Blood Pressure Diastolic Left</td>\n",
+       "      <td>Manual BPd L</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220051</th>\n",
+       "      <td>Arterial Blood Pressure diastolic</td>\n",
+       "      <td>ABPd</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227242</th>\n",
+       "      <td>Manual Blood Pressure Diastolic Right</td>\n",
+       "      <td>Manual BPd R</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8441</th>\n",
+       "      <td>NBP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8364</th>\n",
+       "      <td>ABP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8502</th>\n",
+       "      <td>BP Cuff [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>87.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8440</th>\n",
+       "      <td>Manual BP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8368</th>\n",
+       "      <td>Arterial BP [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8503</th>\n",
+       "      <td>BP Left Arm [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8504</th>\n",
+       "      <td>BP Left Leg [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8507</th>\n",
+       "      <td>BP Right Leg [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8506</th>\n",
+       "      <td>BP Right Arm [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8555</th>\n",
+       "      <td>Arterial BP #2 [Diastolic]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                        label      abbreviation      linksto  \\\n",
+       "itemid                                                                         \n",
+       "220180  Non Invasive Blood Pressure diastolic              NBPd  chartevents   \n",
+       "225310                       ART BP Diastolic  ART BP Diastolic  chartevents   \n",
+       "224643   Manual Blood Pressure Diastolic Left      Manual BPd L  chartevents   \n",
+       "220051      Arterial Blood Pressure diastolic              ABPd  chartevents   \n",
+       "227242  Manual Blood Pressure Diastolic Right      Manual BPd R  chartevents   \n",
+       "8441                          NBP [Diastolic]                    chartevents   \n",
+       "8364                          ABP [Diastolic]                    chartevents   \n",
+       "8502                      BP Cuff [Diastolic]                    chartevents   \n",
+       "8440                    Manual BP [Diastolic]                    chartevents   \n",
+       "8368                  Arterial BP [Diastolic]                    chartevents   \n",
+       "8503                  BP Left Arm [Diastolic]                    chartevents   \n",
+       "8504                  BP Left Leg [Diastolic]                    chartevents   \n",
+       "8507                 BP Right Leg [Diastolic]                    chartevents   \n",
+       "8506                 BP Right Arm [Diastolic]                    chartevents   \n",
+       "8555               Arterial BP #2 [Diastolic]                    chartevents   \n",
+       "\n",
+       "                   category unitname       score  \n",
+       "itemid                                            \n",
+       "220180  Routine Vital Signs     mmHg  110.000000  \n",
+       "225310  Routine Vital Signs     mmHg  110.000000  \n",
+       "224643  Routine Vital Signs     mmHg  110.000000  \n",
+       "220051  Routine Vital Signs     mmHg  110.000000  \n",
+       "227242  Routine Vital Signs     mmHg  110.000000  \n",
+       "8441                                   95.666667  \n",
+       "8364                                   95.666667  \n",
+       "8502                                   87.666667  \n",
+       "8440                                   84.666667  \n",
+       "8368                                   82.000000  \n",
+       "8503                                   82.000000  \n",
+       "8504                                   82.000000  \n",
+       "8507                                   81.000000  \n",
+       "8506                                   81.000000  \n",
+       "8555                                   79.000000  "
+      ]
+     },
+     "execution_count": 79,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.loc[keep_dict[data_dict.labels.BLOOD_PRESSURE_DIASTOLIC], :]  # review every itemid kept for diastolic BP"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### O2 Sat"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 80,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>50817</th>\n",
+       "      <td>OXYGEN SATURATION</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220277</th>\n",
+       "      <td>O2 saturation pulseoxymetry</td>\n",
+       "      <td>SpO2</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>%</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>646</th>\n",
+       "      <td>SpO2</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228232</th>\n",
+       "      <td>PAR-Oxygen saturation</td>\n",
+       "      <td>PAR-Oxygen saturation</td>\n",
+       "      <td></td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td></td>\n",
+       "      <td>102.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3785</th>\n",
+       "      <td>PO2</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>ABG's</td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3837</th>\n",
+       "      <td>pO2</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>ABG'S</td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50821</th>\n",
+       "      <td>PO2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6719</th>\n",
+       "      <td>SpO2-L</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1341</th>\n",
+       "      <td>PULSE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1725</th>\n",
+       "      <td>Pulse</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1332</th>\n",
+       "      <td>pulse</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50816</th>\n",
+       "      <td>OXYGEN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2955</th>\n",
+       "      <td>JVO2 SAT</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2574</th>\n",
+       "      <td>MVO2 SAT</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227873</th>\n",
+       "      <td>Recovery O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>Recovery O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>OT Notes</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223772</th>\n",
+       "      <td>SvO2</td>\n",
+       "      <td>SvO2</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223769</th>\n",
+       "      <td>O2 Saturation Pulseoxymetry Alarm - High</td>\n",
+       "      <td>SpO2 Alarm - High</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227867</th>\n",
+       "      <td>Activity O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>Activity O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>OT Notes</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223770</th>\n",
+       "      <td>O2 Saturation Pulseoxymetry Alarm - Low</td>\n",
+       "      <td>SpO2 Alarm - Low</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226861</th>\n",
+       "      <td>ART %O2 saturation (PA Line)</td>\n",
+       "      <td>ART %O2 saturation (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225674</th>\n",
+       "      <td>Mixed Venous O2% Sat</td>\n",
+       "      <td>Mixed Venous O2% Sat</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226862</th>\n",
+       "      <td>PA %O2 Saturation (PA Line)</td>\n",
+       "      <td>PA %O2 Saturation (PA Line)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PA Line Insertion</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227686</th>\n",
+       "      <td>Central Venous O2% Sat</td>\n",
+       "      <td>Central Venous O2% Sat</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227546</th>\n",
+       "      <td>SVV (Arterial)</td>\n",
+       "      <td>SVV (Arterial)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227549</th>\n",
+       "      <td>ScvO2 (Presep)</td>\n",
+       "      <td>ScvO2 (Presep)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226993</th>\n",
+       "      <td>ApacheIV_LOS</td>\n",
+       "      <td>ApacheIV_LOS</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227008</th>\n",
+       "      <td>Ejection Fraction</td>\n",
+       "      <td>Ejection Fraction</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227010</th>\n",
+       "      <td>FiO2_ApacheIV</td>\n",
+       "      <td>FiO2_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226272</th>\n",
+       "      <td>EF (CCO)</td>\n",
+       "      <td>EF (CCO)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hemodynamics</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228184</th>\n",
+       "      <td>SVV (PiCCO)</td>\n",
+       "      <td>SVV (PiCCO)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PiCCO</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227861</th>\n",
+       "      <td>Rest O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>Rest O2 Sat - Aerobic Capacity</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>OT Notes</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226253</th>\n",
+       "      <td>SpO2 Desat Limit</td>\n",
+       "      <td>SpO2 Desat Limit</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Alarms</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224704</th>\n",
+       "      <td>ATC %</td>\n",
+       "      <td>ATC %</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Respiratory</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228378</th>\n",
+       "      <td>TFCd (NICOM)</td>\n",
+       "      <td>TFCd (NICOM)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>NICOM</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226745</th>\n",
+       "      <td>APACHE II Predecited Death Rate</td>\n",
+       "      <td>APACHE II PDR</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227919</th>\n",
+       "      <td>Rest O2 Sat - Aerobic Activity Response</td>\n",
+       "      <td>Rest O2 Sat - Aerobic Activity Response</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>OT Notes</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226744</th>\n",
+       "      <td>APACHE II PDR - Adjusted</td>\n",
+       "      <td>APACHE II PDR - Adjusted</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228377</th>\n",
+       "      <td>SVI Change</td>\n",
+       "      <td>SVI Change</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>NICOM</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226754</th>\n",
+       "      <td>FiO2ApacheIIValue</td>\n",
+       "      <td>FiO2ApacheIIValue</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228375</th>\n",
+       "      <td>Stroke Volume Index (SVI NICOM)</td>\n",
+       "      <td>Stroke Volume Index (SVI NICOM)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>NICOM</td>\n",
+       "      <td>%</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                           label  \\\n",
+       "itemid                                             \n",
+       "50817                          OXYGEN SATURATION   \n",
+       "220277               O2 saturation pulseoxymetry   \n",
+       "646                                         SpO2   \n",
+       "228232                     PAR-Oxygen saturation   \n",
+       "3785                                         PO2   \n",
+       "3837                                         pO2   \n",
+       "50821                                        PO2   \n",
+       "6719                                      SpO2-L   \n",
+       "1341                                       PULSE   \n",
+       "1725                                       Pulse   \n",
+       "1332                                       pulse   \n",
+       "50816                                     OXYGEN   \n",
+       "2955                                    JVO2 SAT   \n",
+       "2574                                    MVO2 SAT   \n",
+       "227873        Recovery O2 Sat - Aerobic Capacity   \n",
+       "223772                                      SvO2   \n",
+       "223769  O2 Saturation Pulseoxymetry Alarm - High   \n",
+       "227867        Activity O2 Sat - Aerobic Capacity   \n",
+       "223770   O2 Saturation Pulseoxymetry Alarm - Low   \n",
+       "226861              ART %O2 saturation (PA Line)   \n",
+       "225674                      Mixed Venous O2% Sat   \n",
+       "226862               PA %O2 Saturation (PA Line)   \n",
+       "227686                    Central Venous O2% Sat   \n",
+       "227546                            SVV (Arterial)   \n",
+       "227549                            ScvO2 (Presep)   \n",
+       "226993                              ApacheIV_LOS   \n",
+       "227008                         Ejection Fraction   \n",
+       "227010                             FiO2_ApacheIV   \n",
+       "226272                                  EF (CCO)   \n",
+       "228184                               SVV (PiCCO)   \n",
+       "227861            Rest O2 Sat - Aerobic Capacity   \n",
+       "226253                          SpO2 Desat Limit   \n",
+       "224704                                     ATC %   \n",
+       "228378                              TFCd (NICOM)   \n",
+       "226745           APACHE II Predecited Death Rate   \n",
+       "227919   Rest O2 Sat - Aerobic Activity Response   \n",
+       "226744                  APACHE II PDR - Adjusted   \n",
+       "228377                                SVI Change   \n",
+       "226754                         FiO2ApacheIIValue   \n",
+       "228375           Stroke Volume Index (SVI NICOM)   \n",
+       "\n",
+       "                                   abbreviation      linksto  \\\n",
+       "itemid                                                         \n",
+       "50817                                       NaN    labevents   \n",
+       "220277                                     SpO2  chartevents   \n",
+       "646                                              chartevents   \n",
+       "228232                    PAR-Oxygen saturation                \n",
+       "3785                                             chartevents   \n",
+       "3837                                             chartevents   \n",
+       "50821                                       NaN    labevents   \n",
+       "6719                                             chartevents   \n",
+       "1341                                             chartevents   \n",
+       "1725                                             chartevents   \n",
+       "1332                                             chartevents   \n",
+       "50816                                       NaN    labevents   \n",
+       "2955                                             chartevents   \n",
+       "2574                                             chartevents   \n",
+       "227873       Recovery O2 Sat - Aerobic Capacity  chartevents   \n",
+       "223772                                     SvO2  chartevents   \n",
+       "223769                        SpO2 Alarm - High  chartevents   \n",
+       "227867       Activity O2 Sat - Aerobic Capacity  chartevents   \n",
+       "223770                         SpO2 Alarm - Low  chartevents   \n",
+       "226861             ART %O2 saturation (PA Line)  chartevents   \n",
+       "225674                     Mixed Venous O2% Sat  chartevents   \n",
+       "226862              PA %O2 Saturation (PA Line)  chartevents   \n",
+       "227686                   Central Venous O2% Sat  chartevents   \n",
+       "227546                           SVV (Arterial)  chartevents   \n",
+       "227549                           ScvO2 (Presep)  chartevents   \n",
+       "226993                             ApacheIV_LOS  chartevents   \n",
+       "227008                        Ejection Fraction  chartevents   \n",
+       "227010                            FiO2_ApacheIV  chartevents   \n",
+       "226272                                 EF (CCO)  chartevents   \n",
+       "228184                              SVV (PiCCO)  chartevents   \n",
+       "227861           Rest O2 Sat - Aerobic Capacity  chartevents   \n",
+       "226253                         SpO2 Desat Limit  chartevents   \n",
+       "224704                                    ATC %  chartevents   \n",
+       "228378                             TFCd (NICOM)  chartevents   \n",
+       "226745                            APACHE II PDR  chartevents   \n",
+       "227919  Rest O2 Sat - Aerobic Activity Response  chartevents   \n",
+       "226744                 APACHE II PDR - Adjusted  chartevents   \n",
+       "228377                               SVI Change  chartevents   \n",
+       "226754                        FiO2ApacheIIValue  chartevents   \n",
+       "228375          Stroke Volume Index (SVI NICOM)  chartevents   \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "50817                BLOOD GAS      NaN  110.000000  \n",
+       "220277             Respiratory        %  110.000000  \n",
+       "646                                      110.000000  \n",
+       "228232     Routine Vital Signs           102.666667  \n",
+       "3785                     ABG's           100.666667  \n",
+       "3837                     ABG'S           100.666667  \n",
+       "50821                BLOOD GAS      NaN  100.666667  \n",
+       "6719                                      96.666667  \n",
+       "1341                                      78.666667  \n",
+       "1725                                      78.666667  \n",
+       "1332                                      78.666667  \n",
+       "50816                BLOOD GAS      NaN   78.000000  \n",
+       "2955                                      78.000000  \n",
+       "2574                                      78.000000  \n",
+       "227873                OT Notes        %   76.666667  \n",
+       "223772            Hemodynamics        %   76.666667  \n",
+       "223769                  Alarms        %   76.666667  \n",
+       "227867                OT Notes        %   76.666667  \n",
+       "223770                  Alarms        %   76.666667  \n",
+       "226861       PA Line Insertion        %   76.666667  \n",
+       "225674                    Labs        %   76.666667  \n",
+       "226862       PA Line Insertion        %   76.666667  \n",
+       "227686                    Labs        %   76.666667  \n",
+       "227546            Hemodynamics        %   76.666667  \n",
+       "227549            Hemodynamics        %   76.666667  \n",
+       "226993  Scores - APACHE IV (2)        %   76.666667  \n",
+       "227008  Scores - APACHE IV (2)        %   76.666667  \n",
+       "227010  Scores - APACHE IV (2)        %   76.666667  \n",
+       "226272            Hemodynamics        %   76.666667  \n",
+       "228184                   PiCCO        %   76.666667  \n",
+       "227861                OT Notes        %   76.666667  \n",
+       "226253                  Alarms        %   76.666667  \n",
+       "224704             Respiratory        %   76.666667  \n",
+       "228378                   NICOM        %   76.666667  \n",
+       "226745      Scores - APACHE II        %   76.666667  \n",
+       "227919                OT Notes        %   76.666667  \n",
+       "226744      Scores - APACHE II        %   76.666667  \n",
+       "228377                   NICOM        %   76.666667  \n",
+       "226754      Scores - APACHE II        %   76.666667  \n",
+       "228375                   NICOM        %   76.666667  "
+      ]
+     },
+     "execution_count": 80,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate items for pulse-oximetry oxygen saturation and preview the first 40 rows.\n",
+    "out_df = explorer.search(\n",
+    "    ['oxygen saturation', 'O2sat', 'pulse oximetry', '%', 'spo2']\n",
+    ")\n",
+    "out_df.head(40)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 81,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for pulse-oximetry oxygen saturation (labels as shown in the search output above).\n",
+    "keep_dict[data_dict.labels.OXYGEN_SATURATION_PULSE_OXIMETRY] = [\n",
+    "    646,     # SpO2\n",
+    "    220277,  # O2 saturation pulseoxymetry\n",
+    "    228232,  # PAR-Oxygen saturation\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Body Temp"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 82,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>50825</th>\n",
+       "      <td>TEMPERATURE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226170</th>\n",
+       "      <td>Head of Bead Measurement</td>\n",
+       "      <td>HOB Measurement</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Treatments</td>\n",
+       "      <td>Degree</td>\n",
+       "      <td>104.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223762</th>\n",
+       "      <td>Temperature Celsius</td>\n",
+       "      <td>Temperature C</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>?C</td>\n",
+       "      <td>104.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223761</th>\n",
+       "      <td>Temperature Fahrenheit</td>\n",
+       "      <td>Temperature F</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td>?F</td>\n",
+       "      <td>104.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>678</th>\n",
+       "      <td>Temperature F</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>104.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>676</th>\n",
+       "      <td>Temperature C</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>104.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>591</th>\n",
+       "      <td>RLE [Temperature]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>597</th>\n",
+       "      <td>RUE [Temperature]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224027</th>\n",
+       "      <td>Skin Temperature</td>\n",
+       "      <td>Skin Temp</td>\n",
+       "      <td></td>\n",
+       "      <td>Skin - Assessment</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224642</th>\n",
+       "      <td>Temperature Site</td>\n",
+       "      <td>Temp Site</td>\n",
+       "      <td></td>\n",
+       "      <td>Routine Vital Signs</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>645</th>\n",
+       "      <td>Skin [Temperature]</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>679</th>\n",
+       "      <td>Temperature F (calc)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>92.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>677</th>\n",
+       "      <td>Temperature C (calc)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>92.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227054</th>\n",
+       "      <td>TemperatureF_ApacheIV</td>\n",
+       "      <td>TemperatureF_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>?F</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224769</th>\n",
+       "      <td>LUE Temp</td>\n",
+       "      <td>LUE Temp</td>\n",
+       "      <td></td>\n",
+       "      <td>Cardiovascular</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224771</th>\n",
+       "      <td>RLE Temp</td>\n",
+       "      <td>RLE Temp</td>\n",
+       "      <td></td>\n",
+       "      <td>Cardiovascular</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224773</th>\n",
+       "      <td>LLE Temp</td>\n",
+       "      <td>LLE Temp</td>\n",
+       "      <td></td>\n",
+       "      <td>Cardiovascular</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2798</th>\n",
+       "      <td>arm 90 degrees</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224674</th>\n",
+       "      <td>Changes in Temperature</td>\n",
+       "      <td>Changes in Temperature</td>\n",
+       "      <td></td>\n",
+       "      <td>Toxicology</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224767</th>\n",
+       "      <td>RUE Temp</td>\n",
+       "      <td>RUE Temp</td>\n",
+       "      <td></td>\n",
+       "      <td>Cardiovascular</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                           label            abbreviation      linksto  \\\n",
+       "itemid                                                                  \n",
+       "50825                TEMPERATURE                     NaN    labevents   \n",
+       "226170  Head of Bead Measurement         HOB Measurement  chartevents   \n",
+       "223762       Temperature Celsius           Temperature C  chartevents   \n",
+       "223761    Temperature Fahrenheit           Temperature F  chartevents   \n",
+       "678                Temperature F                          chartevents   \n",
+       "676                Temperature C                          chartevents   \n",
+       "591            RLE [Temperature]                          chartevents   \n",
+       "597            RUE [Temperature]                          chartevents   \n",
+       "224027          Skin Temperature               Skin Temp                \n",
+       "224642          Temperature Site               Temp Site                \n",
+       "645           Skin [Temperature]                          chartevents   \n",
+       "679         Temperature F (calc)                          chartevents   \n",
+       "677         Temperature C (calc)                          chartevents   \n",
+       "227054     TemperatureF_ApacheIV   TemperatureF_ApacheIV  chartevents   \n",
+       "224769                  LUE Temp                LUE Temp                \n",
+       "224771                  RLE Temp                RLE Temp                \n",
+       "224773                  LLE Temp                LLE Temp                \n",
+       "2798              arm 90 degrees                          chartevents   \n",
+       "224674    Changes in Temperature  Changes in Temperature                \n",
+       "224767                  RUE Temp                RUE Temp                \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "50825                BLOOD GAS      NaN  110.000000  \n",
+       "226170              Treatments   Degree  104.666667  \n",
+       "223762     Routine Vital Signs       ?C  104.666667  \n",
+       "223761     Routine Vital Signs       ?F  104.666667  \n",
+       "678                                      104.666667  \n",
+       "676                                      104.666667  \n",
+       "591                                       98.000000  \n",
+       "597                                       98.000000  \n",
+       "224027       Skin - Assessment            97.333333  \n",
+       "224642     Routine Vital Signs            97.333333  \n",
+       "645                                       95.666667  \n",
+       "679                                       92.333333  \n",
+       "677                                       92.333333  \n",
+       "227054  Scores - APACHE IV (2)       ?F   89.333333  \n",
+       "224769          Cardiovascular            88.000000  \n",
+       "224771          Cardiovascular            88.000000  \n",
+       "224773          Cardiovascular            88.000000  \n",
+       "2798                                      88.000000  \n",
+       "224674              Toxicology            88.000000  \n",
+       "224767          Cardiovascular            88.000000  "
+      ]
+     },
+     "execution_count": 82,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate items for body temperature and preview the first 20 rows.\n",
+    "# The unit terms are spelled 'celsius' / 'fahrenheit' so they line up with the item\n",
+    "# labels in the definitions table (e.g. 'Temperature Celsius', 'Temperature Fahrenheit').\n",
+    "out_df = explorer.search([\n",
+    "        'temperature',\n",
+    "        'temp',\n",
+    "        'celsius',\n",
+    "        'fahrenheit',\n",
+    "        'degrees',\n",
+    "        'deg'\n",
+    "    ])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 83,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for body temperature (labels as shown in the search output above).\n",
+    "keep_dict[data_dict.labels.TEMPERATURE_BODY] = [\n",
+    "    223761,  # Temperature Fahrenheit\n",
+    "    678,     # Temperature F\n",
+    "    223762,  # Temperature Celsius\n",
+    "    676,     # Temperature C\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Weight"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 97,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>763</th>\n",
+       "      <td>Daily Weight</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226512</th>\n",
+       "      <td>Admission Weight (Kg)</td>\n",
+       "      <td>Admission Weight (Kg)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>General</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226846</th>\n",
+       "      <td>Feeding Weight</td>\n",
+       "      <td>Feeding Weight</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>General</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224639</th>\n",
+       "      <td>Daily Weight</td>\n",
+       "      <td>Daily Weight</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>General</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3693</th>\n",
+       "      <td>Weight Kg</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>968</th>\n",
+       "      <td>EKG</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225402</th>\n",
+       "      <td>EKG</td>\n",
+       "      <td>EKG</td>\n",
+       "      <td>procedureevents_mv</td>\n",
+       "      <td>4-Procedures</td>\n",
+       "      <td>None</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226184</th>\n",
+       "      <td>Estimated Protein Needs/Kg</td>\n",
+       "      <td>Estimated Protein Needs/Kg</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>General</td>\n",
+       "      <td>g/kg</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>733</th>\n",
+       "      <td>Weight Change</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>85.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226707</th>\n",
+       "      <td>Height</td>\n",
+       "      <td>Height</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>General</td>\n",
+       "      <td>Inch</td>\n",
+       "      <td>83.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4183</th>\n",
+       "      <td>Birthweight (kg)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228179</th>\n",
+       "      <td>ELWI (PiCCO)</td>\n",
+       "      <td>ELWI (PiCCO)</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>PiCCO</td>\n",
+       "      <td>ml/kg</td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>580</th>\n",
+       "      <td>Previous Weight</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43622</th>\n",
+       "      <td>cc/kg</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>581</th>\n",
+       "      <td>Previous WeightF</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7000</th>\n",
+       "      <td>ideal body weight</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45271</th>\n",
+       "      <td>Chucks Pad Weight</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3723</th>\n",
+       "      <td>Birth Weight    (kg)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3581</th>\n",
+       "      <td>Present Weight  (lb)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3692</th>\n",
+       "      <td>Weight Change  (gms)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                             label                abbreviation  \\\n",
+       "itemid                                                           \n",
+       "763                   Daily Weight                               \n",
+       "226512       Admission Weight (Kg)       Admission Weight (Kg)   \n",
+       "226846              Feeding Weight              Feeding Weight   \n",
+       "224639                Daily Weight                Daily Weight   \n",
+       "3693                     Weight Kg                               \n",
+       "968                            EKG                               \n",
+       "225402                         EKG                         EKG   \n",
+       "226184  Estimated Protein Needs/Kg  Estimated Protein Needs/Kg   \n",
+       "733                  Weight Change                               \n",
+       "226707                      Height                      Height   \n",
+       "4183              Birthweight (kg)                               \n",
+       "228179                ELWI (PiCCO)                ELWI (PiCCO)   \n",
+       "580                Previous Weight                               \n",
+       "43622                        cc/kg                               \n",
+       "581               Previous WeightF                               \n",
+       "7000             ideal body weight                               \n",
+       "45271            Chucks Pad Weight                               \n",
+       "3723          Birth Weight    (kg)                               \n",
+       "3581          Present Weight  (lb)                               \n",
+       "3692          Weight Change  (gms)                               \n",
+       "\n",
+       "                   linksto      category unitname       score  \n",
+       "itemid                                                         \n",
+       "763            chartevents                         110.000000  \n",
+       "226512         chartevents       General       kg  110.000000  \n",
+       "226846         chartevents       General       kg  110.000000  \n",
+       "224639         chartevents       General       kg  110.000000  \n",
+       "3693           chartevents                          96.666667  \n",
+       "968            chartevents                          96.666667  \n",
+       "225402  procedureevents_mv  4-Procedures     None   96.666667  \n",
+       "226184         chartevents       General     g/kg   88.000000  \n",
+       "733            chartevents                          85.333333  \n",
+       "226707         chartevents       General     Inch   83.000000  \n",
+       "4183           chartevents                          81.666667  \n",
+       "228179         chartevents         PiCCO    ml/kg   81.333333  \n",
+       "580            chartevents                          81.333333  \n",
+       "43622       inputevents_cv                          81.333333  \n",
+       "581            chartevents                          80.000000  \n",
+       "7000           chartevents                          78.000000  \n",
+       "45271       inputevents_cv                          78.000000  \n",
+       "3723           chartevents                          77.666667  \n",
+       "3581           chartevents                          76.000000  \n",
+       "3692           chartevents                          76.000000  "
+      ]
+     },
+     "execution_count": 97,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate items for body weight and preview the first 20 rows.\n",
+    "out_df = explorer.search(['weight', 'daily weight', 'kg'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 98,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Items kept for body weight, per the search results above:\n",
+    "# 763 (Daily Weight), 224639 (Daily Weight), 3693 (Weight Kg).\n",
+    "keep_dict[data_dict.labels.WEIGHT_BODY] = [763, 224639, 3693]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Urine Output"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 84,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>226560</th>\n",
+       "      <td>Void</td>\n",
+       "      <td>Void</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43332</th>\n",
+       "      <td>void</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7672</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3686</th>\n",
+       "      <td>Void</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45967</th>\n",
+       "      <td>foley</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43053</th>\n",
+       "      <td>URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226559</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td>Foley</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44103</th>\n",
+       "      <td>ER urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44834</th>\n",
+       "      <td>er urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227519</th>\n",
+       "      <td>Urine output_ApacheIV</td>\n",
+       "      <td>Urine output</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>None</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44706</th>\n",
+       "      <td>urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42892</th>\n",
+       "      <td>EW URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45415</th>\n",
+       "      <td>ED Urine OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43987</th>\n",
+       "      <td>urine out or</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42666</th>\n",
+       "      <td>E.R. URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44237</th>\n",
+       "      <td>E.R. urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42592</th>\n",
+       "      <td>VICU URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40069</th>\n",
+       "      <td>Urine Out Void</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46423</th>\n",
+       "      <td>ed foley</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43931</th>\n",
+       "      <td>Floor urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                        label  abbreviation         linksto  \\\n",
+       "itemid                                                        \n",
+       "226560                   Void          Void    outputevents   \n",
+       "43332                    void                inputevents_cv   \n",
+       "7672                    Foley                   chartevents   \n",
+       "3686                     Void                   chartevents   \n",
+       "45967                   foley                inputevents_cv   \n",
+       "43053               URINE OUT                  outputevents   \n",
+       "226559                  Foley         Foley    outputevents   \n",
+       "44103            ER urine out                  outputevents   \n",
+       "44834            er urine out                  outputevents   \n",
+       "227519  Urine output_ApacheIV  Urine output     chartevents   \n",
+       "44706            urine output                  outputevents   \n",
+       "42892            EW URINE OUT                  outputevents   \n",
+       "45415            ED Urine OUT                  outputevents   \n",
+       "43987            urine out or                  outputevents   \n",
+       "42666          E.R. URINE OUT                  outputevents   \n",
+       "44237          E.R. urine out                  outputevents   \n",
+       "42592          VICU URINE OUT                  outputevents   \n",
+       "40069          Urine Out Void                  outputevents   \n",
+       "46423                ed foley                inputevents_cv   \n",
+       "43931         Floor urine out                  outputevents   \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "226560                  Output       mL  110.000000  \n",
+       "43332                                    110.000000  \n",
+       "7672                                     110.000000  \n",
+       "3686                                     110.000000  \n",
+       "45967                                    110.000000  \n",
+       "43053                                    110.000000  \n",
+       "226559                  Output       mL  110.000000  \n",
+       "44103                                    100.666667  \n",
+       "44834                                    100.666667  \n",
+       "227519  Scores - APACHE IV (2)     None  100.666667  \n",
+       "44706                                    100.666667  \n",
+       "42892                                    100.666667  \n",
+       "45415                                    100.666667  \n",
+       "43987                                    100.666667  \n",
+       "42666                                     96.666667  \n",
+       "44237                                     96.666667  \n",
+       "42592                                     95.333333  \n",
+       "40069                                     95.333333  \n",
+       "46423                                     94.666667  \n",
+       "43931                                     93.333333  "
+      ]
+     },
+     "execution_count": 84,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate items for urine output and preview the first 20 rows.\n",
+    "out_df = explorer.search(['urine out', 'void', 'foley'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 85,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>226560</th>\n",
+       "      <td>Void</td>\n",
+       "      <td>Void</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43332</th>\n",
+       "      <td>void</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7672</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3686</th>\n",
+       "      <td>Void</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45967</th>\n",
+       "      <td>foley</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43053</th>\n",
+       "      <td>URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226559</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td>Foley</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44103</th>\n",
+       "      <td>ER urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44834</th>\n",
+       "      <td>er urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227519</th>\n",
+       "      <td>Urine output_ApacheIV</td>\n",
+       "      <td>Urine output</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>None</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44706</th>\n",
+       "      <td>urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42892</th>\n",
+       "      <td>EW URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45415</th>\n",
+       "      <td>ED Urine OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43987</th>\n",
+       "      <td>urine out or</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42666</th>\n",
+       "      <td>E.R. URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44237</th>\n",
+       "      <td>E.R. urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42592</th>\n",
+       "      <td>VICU URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40069</th>\n",
+       "      <td>Urine Out Void</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46423</th>\n",
+       "      <td>ed foley</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>94.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43931</th>\n",
+       "      <td>Floor urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43348</th>\n",
+       "      <td>urine output/kg</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40405</th>\n",
+       "      <td>Urine Out Other</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42810</th>\n",
+       "      <td>angio urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46180</th>\n",
+       "      <td>urine out-angio</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40055</th>\n",
+       "      <td>Urine Out Foley</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44253</th>\n",
+       "      <td>Urine out angio</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44325</th>\n",
+       "      <td>ED URINE OUTPUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41857</th>\n",
+       "      <td>urine out in er</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44824</th>\n",
+       "      <td>EW urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45991</th>\n",
+       "      <td>ew-urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42042</th>\n",
+       "      <td>ANGIO URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46177</th>\n",
+       "      <td>URINE OUT-ANGIO</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44684</th>\n",
+       "      <td>floor urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46658</th>\n",
+       "      <td>ED Urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46578</th>\n",
+       "      <td>URINE OUTPUT-ER</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42765</th>\n",
+       "      <td>FARR 6 URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>91.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>70081</th>\n",
+       "      <td>URINE</td>\n",
+       "      <td></td>\n",
+       "      <td>microbiologyevents</td>\n",
+       "      <td>SPECIMEN</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3819</th>\n",
+       "      <td>Urine Leukocytes</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>70079</th>\n",
+       "      <td>URINE</td>\n",
+       "      <td></td>\n",
+       "      <td>microbiologyevents</td>\n",
+       "      <td>SPECIMEN</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43462</th>\n",
+       "      <td>urine</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                        label  abbreviation             linksto  \\\n",
+       "itemid                                                            \n",
+       "226560                   Void          Void        outputevents   \n",
+       "43332                    void                    inputevents_cv   \n",
+       "7672                    Foley                       chartevents   \n",
+       "3686                     Void                       chartevents   \n",
+       "45967                   foley                    inputevents_cv   \n",
+       "43053               URINE OUT                      outputevents   \n",
+       "226559                  Foley         Foley        outputevents   \n",
+       "44103            ER urine out                      outputevents   \n",
+       "44834            er urine out                      outputevents   \n",
+       "227519  Urine output_ApacheIV  Urine output         chartevents   \n",
+       "44706            urine output                      outputevents   \n",
+       "42892            EW URINE OUT                      outputevents   \n",
+       "45415            ED Urine OUT                      outputevents   \n",
+       "43987            urine out or                      outputevents   \n",
+       "42666          E.R. URINE OUT                      outputevents   \n",
+       "44237          E.R. urine out                      outputevents   \n",
+       "42592          VICU URINE OUT                      outputevents   \n",
+       "40069          Urine Out Void                      outputevents   \n",
+       "46423                ed foley                    inputevents_cv   \n",
+       "43931         Floor urine out                      outputevents   \n",
+       "43348         urine output/kg                      outputevents   \n",
+       "40405         Urine Out Other                      outputevents   \n",
+       "42810         angio urine out                      outputevents   \n",
+       "46180         urine out-angio                      outputevents   \n",
+       "40055         Urine Out Foley                      outputevents   \n",
+       "44253         Urine out angio                      outputevents   \n",
+       "44325         ED URINE OUTPUT                      outputevents   \n",
+       "41857         urine out in er                      outputevents   \n",
+       "44824         EW urine output                      outputevents   \n",
+       "45991         ew-urine output                      outputevents   \n",
+       "42042         ANGIO URINE OUT                      outputevents   \n",
+       "46177         URINE OUT-ANGIO                      outputevents   \n",
+       "44684         floor urine out                      outputevents   \n",
+       "46658         ED Urine output                      outputevents   \n",
+       "46578         URINE OUTPUT-ER                      outputevents   \n",
+       "42765        FARR 6 URINE OUT                      outputevents   \n",
+       "70081                   URINE                microbiologyevents   \n",
+       "3819         Urine Leukocytes                       chartevents   \n",
+       "70079                   URINE                microbiologyevents   \n",
+       "43462                   urine                      outputevents   \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "226560                  Output       mL  110.000000  \n",
+       "43332                                    110.000000  \n",
+       "7672                                     110.000000  \n",
+       "3686                                     110.000000  \n",
+       "45967                                    110.000000  \n",
+       "43053                                    110.000000  \n",
+       "226559                  Output       mL  110.000000  \n",
+       "44103                                    100.666667  \n",
+       "44834                                    100.666667  \n",
+       "227519  Scores - APACHE IV (2)     None  100.666667  \n",
+       "44706                                    100.666667  \n",
+       "42892                                    100.666667  \n",
+       "45415                                    100.666667  \n",
+       "43987                                    100.666667  \n",
+       "42666                                     96.666667  \n",
+       "44237                                     96.666667  \n",
+       "42592                                     95.333333  \n",
+       "40069                                     95.333333  \n",
+       "46423                                     94.666667  \n",
+       "43931                                     93.333333  \n",
+       "43348                                     93.333333  \n",
+       "40405                                     93.333333  \n",
+       "42810                                     93.333333  \n",
+       "46180                                     93.333333  \n",
+       "40055                                     93.333333  \n",
+       "44253                                     93.333333  \n",
+       "44325                                     93.333333  \n",
+       "41857                                     93.333333  \n",
+       "44824                                     93.333333  \n",
+       "45991                                     93.333333  \n",
+       "42042                                     93.333333  \n",
+       "46177                                     93.333333  \n",
+       "44684                                     93.333333  \n",
+       "46658                                     93.333333  \n",
+       "46578                                     93.333333  \n",
+       "42765                                     91.333333  \n",
+       "70081                 SPECIMEN            90.666667  \n",
+       "3819                     Urine            90.666667  \n",
+       "70079                 SPECIMEN            90.666667  \n",
+       "43462                                     90.666667  "
+      ]
+     },
+     "execution_count": 85,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.head(40)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 86,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Keep only the candidate items whose events live in outputevents or chartevents.\n",
+    "out_df = out_df.loc[out_df['linksto'].isin(['outputevents','chartevents'])]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 87,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>226560</th>\n",
+       "      <td>Void</td>\n",
+       "      <td>Void</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7672</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3686</th>\n",
+       "      <td>Void</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43053</th>\n",
+       "      <td>URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226559</th>\n",
+       "      <td>Foley</td>\n",
+       "      <td>Foley</td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td>Output</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44103</th>\n",
+       "      <td>ER urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44834</th>\n",
+       "      <td>er urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227519</th>\n",
+       "      <td>Urine output_ApacheIV</td>\n",
+       "      <td>Urine output</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>None</td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44706</th>\n",
+       "      <td>urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42892</th>\n",
+       "      <td>EW URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45415</th>\n",
+       "      <td>ED Urine OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43987</th>\n",
+       "      <td>urine out or</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42666</th>\n",
+       "      <td>E.R. URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44237</th>\n",
+       "      <td>E.R. urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42592</th>\n",
+       "      <td>VICU URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40069</th>\n",
+       "      <td>Urine Out Void</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>95.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43931</th>\n",
+       "      <td>Floor urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43348</th>\n",
+       "      <td>urine output/kg</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40405</th>\n",
+       "      <td>Urine Out Other</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42810</th>\n",
+       "      <td>angio urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46180</th>\n",
+       "      <td>urine out-angio</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40055</th>\n",
+       "      <td>Urine Out Foley</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44253</th>\n",
+       "      <td>Urine out angio</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44325</th>\n",
+       "      <td>ED URINE OUTPUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41857</th>\n",
+       "      <td>urine out in er</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44824</th>\n",
+       "      <td>EW urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45991</th>\n",
+       "      <td>ew-urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42042</th>\n",
+       "      <td>ANGIO URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46177</th>\n",
+       "      <td>URINE OUT-ANGIO</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44684</th>\n",
+       "      <td>floor urine out</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46658</th>\n",
+       "      <td>ED Urine output</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46578</th>\n",
+       "      <td>URINE OUTPUT-ER</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>93.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42765</th>\n",
+       "      <td>FARR 6 URINE OUT</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>91.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3819</th>\n",
+       "      <td>Urine Leukocytes</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43462</th>\n",
+       "      <td>urine</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3816</th>\n",
+       "      <td>Urine Glucose</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3817</th>\n",
+       "      <td>Urine Heme</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3818</th>\n",
+       "      <td>Urine Ketones</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3822</th>\n",
+       "      <td>Urine Protein</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Urine</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6298</th>\n",
+       "      <td>foley d/c</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                        label  abbreviation       linksto  \\\n",
+       "itemid                                                      \n",
+       "226560                   Void          Void  outputevents   \n",
+       "7672                    Foley                 chartevents   \n",
+       "3686                     Void                 chartevents   \n",
+       "43053               URINE OUT                outputevents   \n",
+       "226559                  Foley         Foley  outputevents   \n",
+       "44103            ER urine out                outputevents   \n",
+       "44834            er urine out                outputevents   \n",
+       "227519  Urine output_ApacheIV  Urine output   chartevents   \n",
+       "44706            urine output                outputevents   \n",
+       "42892            EW URINE OUT                outputevents   \n",
+       "45415            ED Urine OUT                outputevents   \n",
+       "43987            urine out or                outputevents   \n",
+       "42666          E.R. URINE OUT                outputevents   \n",
+       "44237          E.R. urine out                outputevents   \n",
+       "42592          VICU URINE OUT                outputevents   \n",
+       "40069          Urine Out Void                outputevents   \n",
+       "43931         Floor urine out                outputevents   \n",
+       "43348         urine output/kg                outputevents   \n",
+       "40405         Urine Out Other                outputevents   \n",
+       "42810         angio urine out                outputevents   \n",
+       "46180         urine out-angio                outputevents   \n",
+       "40055         Urine Out Foley                outputevents   \n",
+       "44253         Urine out angio                outputevents   \n",
+       "44325         ED URINE OUTPUT                outputevents   \n",
+       "41857         urine out in er                outputevents   \n",
+       "44824         EW urine output                outputevents   \n",
+       "45991         ew-urine output                outputevents   \n",
+       "42042         ANGIO URINE OUT                outputevents   \n",
+       "46177         URINE OUT-ANGIO                outputevents   \n",
+       "44684         floor urine out                outputevents   \n",
+       "46658         ED Urine output                outputevents   \n",
+       "46578         URINE OUTPUT-ER                outputevents   \n",
+       "42765        FARR 6 URINE OUT                outputevents   \n",
+       "3819         Urine Leukocytes                 chartevents   \n",
+       "43462                   urine                outputevents   \n",
+       "3816            Urine Glucose                 chartevents   \n",
+       "3817               Urine Heme                 chartevents   \n",
+       "3818            Urine Ketones                 chartevents   \n",
+       "3822            Urine Protein                 chartevents   \n",
+       "6298                foley d/c                 chartevents   \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "226560                  Output       mL  110.000000  \n",
+       "7672                                     110.000000  \n",
+       "3686                                     110.000000  \n",
+       "43053                                    110.000000  \n",
+       "226559                  Output       mL  110.000000  \n",
+       "44103                                    100.666667  \n",
+       "44834                                    100.666667  \n",
+       "227519  Scores - APACHE IV (2)     None  100.666667  \n",
+       "44706                                    100.666667  \n",
+       "42892                                    100.666667  \n",
+       "45415                                    100.666667  \n",
+       "43987                                    100.666667  \n",
+       "42666                                     96.666667  \n",
+       "44237                                     96.666667  \n",
+       "42592                                     95.333333  \n",
+       "40069                                     95.333333  \n",
+       "43931                                     93.333333  \n",
+       "43348                                     93.333333  \n",
+       "40405                                     93.333333  \n",
+       "42810                                     93.333333  \n",
+       "46180                                     93.333333  \n",
+       "40055                                     93.333333  \n",
+       "44253                                     93.333333  \n",
+       "44325                                     93.333333  \n",
+       "41857                                     93.333333  \n",
+       "44824                                     93.333333  \n",
+       "45991                                     93.333333  \n",
+       "42042                                     93.333333  \n",
+       "46177                                     93.333333  \n",
+       "44684                                     93.333333  \n",
+       "46658                                     93.333333  \n",
+       "46578                                     93.333333  \n",
+       "42765                                     91.333333  \n",
+       "3819                     Urine            90.666667  \n",
+       "43462                                     90.666667  \n",
+       "3816                     Urine            90.666667  \n",
+       "3817                     Urine            90.666667  \n",
+       "3818                     Urine            90.666667  \n",
+       "3822                     Urine            90.666667  \n",
+       "6298                                      90.666667  "
+      ]
+     },
+     "execution_count": 87,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.head(40)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 91,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "# Remove itemid 227519 ('Urine output_ApacheIV', category 'Scores - APACHE IV (2)').\n",
+    "# Reassigning instead of using inplace=True, together with errors='ignore', keeps\n",
+    "# this cell safe to re-run: a second run no longer raises KeyError for the\n",
+    "# already-removed label.\n",
+    "out_df = out_df.drop(227519, axis=0, errors='ignore')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 96,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "# Label-based slice: take every row from the top of out_df (in its current row\n",
+    "# order) down to and including itemid 46578 ('URINE OUTPUT-ER'), then store the\n",
+    "# de-duplicated itemids as a plain Python list.\n",
+    "keep_dict[data_dict.labels.OUTPUT_URINE] = (\n",
+    "    out_df.loc[:46578]\n",
+    "    .index.unique()\n",
+    "    .tolist()\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Additional urine output item IDs, following the MIMIC Code Repository urine output query: https://github.com/MIT-LCP/mimic-code/blob/travis/concepts/cookbook/uo.sql"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Extra urine-output itemids to keep in addition to those selected from out_df.\n",
+    "# NOTE(review): presumably copied from the uo.sql query linked in the markdown\n",
+    "# cell above -- confirm against that file.\n",
+    "to_add = [43175,40094,40715,40473,40085,40057,40056,40428,40086,40096,40651]\n",
+    "to_add += [227510,226561,226584,226563,226564,226565,226567,226557,226558]\n",
+    "\n",
+    "# Merge the extra ids into the keep list. The original cell assigned the list to\n",
+    "# itself and never used to_add, so these ids were silently left out.\n",
+    "# Ids that are already present are skipped, so re-running the cell does not\n",
+    "# append duplicates.\n",
+    "urine_ids = keep_dict[data_dict.labels.OUTPUT_URINE]\n",
+    "keep_dict[data_dict.labels.OUTPUT_URINE] = urine_ids + [i for i in to_add if i not in urine_ids]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Glasgow Coma Scale (GCS)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Eye Opening"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 99,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>184</th>\n",
+       "      <td>Eye Opening</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220739</th>\n",
+       "      <td>GCS - Eye Opening</td>\n",
+       "      <td>Eye Opening</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>198</th>\n",
+       "      <td>GCS Total</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>70033</th>\n",
+       "      <td>EYE</td>\n",
+       "      <td></td>\n",
+       "      <td>microbiologyevents</td>\n",
+       "      <td>SPECIMEN</td>\n",
+       "      <td></td>\n",
+       "      <td>72.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3742</th>\n",
+       "      <td>Basos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3791</th>\n",
+       "      <td>Polys</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3779</th>\n",
+       "      <td>Monos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2834</th>\n",
+       "      <td>ICS</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227011</th>\n",
+       "      <td>GCSEye_ApacheIV</td>\n",
+       "      <td>GCSEye_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>65.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226755</th>\n",
+       "      <td>GcsApacheIIScore</td>\n",
+       "      <td>GcsApacheIIScore</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>None</td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41556</th>\n",
+       "      <td>ng</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>64.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227012</th>\n",
+       "      <td>GCSMotor_ApacheIV</td>\n",
+       "      <td>GCSMotor_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227013</th>\n",
+       "      <td>GcsScore_ApacheIV</td>\n",
+       "      <td>GcsScore_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>None</td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5700</th>\n",
+       "      <td>Gent eye oint</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>63.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227014</th>\n",
+       "      <td>GCSVerbal_ApacheIV</td>\n",
+       "      <td>GCSVerbal_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>62.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50931</th>\n",
+       "      <td>GLUCOSE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>62.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1529</th>\n",
+       "      <td>Glucose</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Chemistry</td>\n",
+       "      <td></td>\n",
+       "      <td>62.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50809</th>\n",
+       "      <td>GLUCOSE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>62.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51478</th>\n",
+       "      <td>GLUCOSE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>62.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223901</th>\n",
+       "      <td>GCS - Motor Response</td>\n",
+       "      <td>Motor Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>61.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                       label        abbreviation             linksto  \\\n",
+       "itemid                                                                 \n",
+       "184              Eye Opening                             chartevents   \n",
+       "220739     GCS - Eye Opening         Eye Opening                       \n",
+       "198                GCS Total                             chartevents   \n",
+       "70033                    EYE                      microbiologyevents   \n",
+       "3742                   Basos                             chartevents   \n",
+       "3791                   Polys                             chartevents   \n",
+       "3779                   Monos                             chartevents   \n",
+       "2834                     ICS                             chartevents   \n",
+       "227011       GCSEye_ApacheIV     GCSEye_ApacheIV                       \n",
+       "226755      GcsApacheIIScore    GcsApacheIIScore         chartevents   \n",
+       "41556                     ng                          inputevents_cv   \n",
+       "227012     GCSMotor_ApacheIV   GCSMotor_ApacheIV                       \n",
+       "227013     GcsScore_ApacheIV   GcsScore_ApacheIV         chartevents   \n",
+       "5700           Gent eye oint                             chartevents   \n",
+       "227014    GCSVerbal_ApacheIV  GCSVerbal_ApacheIV                       \n",
+       "50931                GLUCOSE                 NaN           labevents   \n",
+       "1529                 Glucose                             chartevents   \n",
+       "50809                GLUCOSE                 NaN           labevents   \n",
+       "51478                GLUCOSE                 NaN           labevents   \n",
+       "223901  GCS - Motor Response      Motor Response                       \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "184                                      110.000000  \n",
+       "220739            Neurological           110.000000  \n",
+       "198                                       76.666667  \n",
+       "70033                 SPECIMEN            72.000000  \n",
+       "3742                       CSF            71.333333  \n",
+       "3791                       CSF            71.333333  \n",
+       "3779                       CSF            71.333333  \n",
+       "2834                                      67.000000  \n",
+       "227011  Scores - APACHE IV (2)            65.333333  \n",
+       "226755      Scores - APACHE II     None   64.666667  \n",
+       "41556                                     64.000000  \n",
+       "227012  Scores - APACHE IV (2)            63.333333  \n",
+       "227013  Scores - APACHE IV (2)     None   63.333333  \n",
+       "5700                                      63.000000  \n",
+       "227014  Scores - APACHE IV (2)            62.666667  \n",
+       "50931                CHEMISTRY      NaN   62.333333  \n",
+       "1529                 Chemistry            62.333333  \n",
+       "50809                BLOOD GAS      NaN   62.333333  \n",
+       "51478               HEMATOLOGY      NaN   62.333333  \n",
+       "223901            Neurological            61.666667  "
+      ]
+     },
+     "execution_count": 99,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate itemids for the GCS eye-opening component.\n",
+    "out_df = explorer.search([\n",
+    "        'glasgow coma scale',\n",
+    "        'GCS',\n",
+    "        'eye opening'\n",
+    "    ])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 100,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# 184 is labelled 'Eye Opening' and 220739 'GCS - Eye Opening' in the search results.\n",
+    "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING] = [184, 220739]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Motor"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 101,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>228405</th>\n",
+       "      <td>Motor L Leg</td>\n",
+       "      <td>Motor L Leg</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>85.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228404</th>\n",
+       "      <td>Motor L Arm</td>\n",
+       "      <td>Motor L Arm</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>85.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228407</th>\n",
+       "      <td>Motor R Leg</td>\n",
+       "      <td>Motor R Leg</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>85.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228406</th>\n",
+       "      <td>Motor R Arm</td>\n",
+       "      <td>Motor R Arm</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>85.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227120</th>\n",
+       "      <td>Motor Deficit</td>\n",
+       "      <td>Motor Deficit</td>\n",
+       "      <td></td>\n",
+       "      <td>Pain/Sedation</td>\n",
+       "      <td></td>\n",
+       "      <td>80.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>453</th>\n",
+       "      <td>Motor Deficits</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>454</th>\n",
+       "      <td>Motor Response</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>223901</th>\n",
+       "      <td>GCS - Motor Response</td>\n",
+       "      <td>Motor Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>198</th>\n",
+       "      <td>GCS Total</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227012</th>\n",
+       "      <td>GCSMotor_ApacheIV</td>\n",
+       "      <td>GCSMotor_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>73.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3779</th>\n",
+       "      <td>Monos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3742</th>\n",
+       "      <td>Basos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3791</th>\n",
+       "      <td>Polys</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226757</th>\n",
+       "      <td>GCSMotorApacheIIValue</td>\n",
+       "      <td>GCSMotorApacheIIValue</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td></td>\n",
+       "      <td>68.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2834</th>\n",
+       "      <td>ICS</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225472</th>\n",
+       "      <td>Pneumothorax</td>\n",
+       "      <td>Pneumothorax</td>\n",
+       "      <td>procedureevents_mv</td>\n",
+       "      <td>3-Significant Events</td>\n",
+       "      <td>None</td>\n",
+       "      <td>66.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227011</th>\n",
+       "      <td>GCSEye_ApacheIV</td>\n",
+       "      <td>GCSEye_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>65.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226755</th>\n",
+       "      <td>GcsApacheIIScore</td>\n",
+       "      <td>GcsApacheIIScore</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td>None</td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220739</th>\n",
+       "      <td>GCS - Eye Opening</td>\n",
+       "      <td>Eye Opening</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>64.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227013</th>\n",
+       "      <td>GcsScore_ApacheIV</td>\n",
+       "      <td>GcsScore_ApacheIV</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td>None</td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                        label           abbreviation             linksto  \\\n",
+       "itemid                                                                     \n",
+       "228405            Motor L Leg            Motor L Leg                       \n",
+       "228404            Motor L Arm            Motor L Arm                       \n",
+       "228407            Motor R Leg            Motor R Leg                       \n",
+       "228406            Motor R Arm            Motor R Arm                       \n",
+       "227120          Motor Deficit          Motor Deficit                       \n",
+       "453            Motor Deficits                                chartevents   \n",
+       "454            Motor Response                                chartevents   \n",
+       "223901   GCS - Motor Response         Motor Response                       \n",
+       "198                 GCS Total                                chartevents   \n",
+       "227012      GCSMotor_ApacheIV      GCSMotor_ApacheIV                       \n",
+       "3779                    Monos                                chartevents   \n",
+       "3742                    Basos                                chartevents   \n",
+       "3791                    Polys                                chartevents   \n",
+       "226757  GCSMotorApacheIIValue  GCSMotorApacheIIValue                       \n",
+       "2834                      ICS                                chartevents   \n",
+       "225472           Pneumothorax           Pneumothorax  procedureevents_mv   \n",
+       "227011        GCSEye_ApacheIV        GCSEye_ApacheIV                       \n",
+       "226755       GcsApacheIIScore       GcsApacheIIScore         chartevents   \n",
+       "220739      GCS - Eye Opening            Eye Opening                       \n",
+       "227013      GcsScore_ApacheIV      GcsScore_ApacheIV         chartevents   \n",
+       "\n",
+       "                      category unitname      score  \n",
+       "itemid                                              \n",
+       "228405            Neurological           85.333333  \n",
+       "228404            Neurological           85.333333  \n",
+       "228407            Neurological           85.333333  \n",
+       "228406            Neurological           85.333333  \n",
+       "227120           Pain/Sedation           80.666667  \n",
+       "453                                      78.666667  \n",
+       "454                                      78.666667  \n",
+       "223901            Neurological           78.666667  \n",
+       "198                                      76.666667  \n",
+       "227012  Scores - APACHE IV (2)           73.333333  \n",
+       "3779                       CSF           71.333333  \n",
+       "3742                       CSF           71.333333  \n",
+       "3791                       CSF           71.333333  \n",
+       "226757      Scores - APACHE II           68.666667  \n",
+       "2834                                     67.000000  \n",
+       "225472    3-Significant Events     None  66.000000  \n",
+       "227011  Scores - APACHE IV (2)           65.333333  \n",
+       "226755      Scores - APACHE II     None  64.666667  \n",
+       "220739            Neurological           64.333333  \n",
+       "227013  Scores - APACHE IV (2)     None  63.333333  "
+      ]
+     },
+     "execution_count": 101,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate itemids for the GCS motor-response component.\n",
+    "out_df = explorer.search([\n",
+    "        'glasgow coma scale',\n",
+    "        'GCS',\n",
+    "        'motor',\n",
+    "        'motor response'\n",
+    "    ])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 102,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# 454 is labelled 'Motor Response' and 223901 'GCS - Motor Response' in the search results.\n",
+    "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_MOTOR] = [454, 223901]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Verbal"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 103,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>223900</th>\n",
+       "      <td>GCS - Verbal Response</td>\n",
+       "      <td>Verbal Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>723</th>\n",
+       "      <td>Verbal Response</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224756</th>\n",
+       "      <td>Response</td>\n",
+       "      <td>Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Neurological</td>\n",
+       "      <td></td>\n",
+       "      <td>90.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41610</th>\n",
+       "      <td>ER</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227014</th>\n",
+       "      <td>GCSVerbal_ApacheIV</td>\n",
+       "      <td>GCSVerbal_ApacheIV</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE IV (2)</td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44473</th>\n",
+       "      <td>er</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>198</th>\n",
+       "      <td>GCS Total</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226758</th>\n",
+       "      <td>GCSVerbalApacheIIValue</td>\n",
+       "      <td>GCSVerbalApacheIIValue</td>\n",
+       "      <td></td>\n",
+       "      <td>Scores - APACHE II</td>\n",
+       "      <td></td>\n",
+       "      <td>72.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3779</th>\n",
+       "      <td>Monos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3742</th>\n",
+       "      <td>Basos</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3791</th>\n",
+       "      <td>Polys</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>CSF</td>\n",
+       "      <td></td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224413</th>\n",
+       "      <td>TOF Response</td>\n",
+       "      <td>TOF Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Pain/Sedation</td>\n",
+       "      <td></td>\n",
+       "      <td>69.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>40450</th>\n",
+       "      <td>EBL</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41693</th>\n",
+       "      <td>Verapamil</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1968</th>\n",
+       "      <td>Verapamil</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42047</th>\n",
+       "      <td>ebl</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>222318</th>\n",
+       "      <td>Verapamil</td>\n",
+       "      <td>Verapamil</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46484</th>\n",
+       "      <td>verapamil</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2834</th>\n",
+       "      <td>ICS</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>224409</th>\n",
+       "      <td>Pain Level Response</td>\n",
+       "      <td>Pain Level Response</td>\n",
+       "      <td></td>\n",
+       "      <td>Pain/Sedation</td>\n",
+       "      <td></td>\n",
+       "      <td>66.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                         label            abbreviation         linksto  \\\n",
+       "itemid                                                                   \n",
+       "223900   GCS - Verbal Response         Verbal Response                   \n",
+       "723            Verbal Response                             chartevents   \n",
+       "224756                Response                Response                   \n",
+       "41610                       ER                          inputevents_cv   \n",
+       "227014      GCSVerbal_ApacheIV      GCSVerbal_ApacheIV                   \n",
+       "44473                       er                          inputevents_cv   \n",
+       "198                  GCS Total                             chartevents   \n",
+       "226758  GCSVerbalApacheIIValue  GCSVerbalApacheIIValue                   \n",
+       "3779                     Monos                             chartevents   \n",
+       "3742                     Basos                             chartevents   \n",
+       "3791                     Polys                             chartevents   \n",
+       "224413            TOF Response            TOF Response                   \n",
+       "40450                      EBL                          inputevents_cv   \n",
+       "41693                Verapamil                          inputevents_cv   \n",
+       "1968                 Verapamil                             chartevents   \n",
+       "42047                      ebl                          inputevents_cv   \n",
+       "222318               Verapamil               Verapamil  inputevents_mv   \n",
+       "46484                verapamil                          inputevents_cv   \n",
+       "2834                       ICS                             chartevents   \n",
+       "224409     Pain Level Response     Pain Level Response                   \n",
+       "\n",
+       "                      category unitname       score  \n",
+       "itemid                                               \n",
+       "223900            Neurological           110.000000  \n",
+       "723                                      110.000000  \n",
+       "224756            Neurological            90.000000  \n",
+       "41610         Free Form Intake            76.666667  \n",
+       "227014  Scores - APACHE IV (2)            76.666667  \n",
+       "44473         Free Form Intake            76.666667  \n",
+       "198                                       76.666667  \n",
+       "226758      Scores - APACHE II            72.000000  \n",
+       "3779                       CSF            71.333333  \n",
+       "3742                       CSF            71.333333  \n",
+       "3791                       CSF            71.333333  \n",
+       "224413           Pain/Sedation            69.666667  \n",
+       "40450                                     67.000000  \n",
+       "41693         Free Form Intake            67.000000  \n",
+       "1968                                      67.000000  \n",
+       "42047                                     67.000000  \n",
+       "222318             Medications       mg   67.000000  \n",
+       "46484         Free Form Intake            67.000000  \n",
+       "2834                                      67.000000  \n",
+       "224409           Pain/Sedation            66.000000  "
+      ]
+     },
+     "execution_count": 103,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate itemids for the GCS verbal-response component.\n",
+    "out_df = explorer.search([\n",
+    "        'glasgow coma scale',\n",
+    "        'GCS',\n",
+    "        'verbal',\n",
+    "        'verbal response'\n",
+    "    ])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 104,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# 723 is labelled 'Verbal Response' and 223900 'GCS - Verbal Response' in the search results.\n",
+    "keep_dict[data_dict.labels.GLASGOW_COMA_SCALE_VERBAL] = [723, 223900]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Labs\n",
+    "\n",
+    "### Lactate"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 105,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>1531</th>\n",
+       "      <td>Lactic Acid</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Chemistry</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225668</th>\n",
+       "      <td>Lactic Acid</td>\n",
+       "      <td>Lactic Acid</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>None</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50813</th>\n",
+       "      <td>LACTATE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220228</th>\n",
+       "      <td>Hemoglobin</td>\n",
+       "      <td>Hemoglobin</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>g/dl</td>\n",
+       "      <td>102.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2773</th>\n",
+       "      <td>sjlactate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>102.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225835</th>\n",
+       "      <td>Na Phos</td>\n",
+       "      <td>Na Phos</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mmol</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225834</th>\n",
+       "      <td>K Phos</td>\n",
+       "      <td>K Phos</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mmol</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227526</th>\n",
+       "      <td>Citrate</td>\n",
+       "      <td>Citrate</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mmol</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225925</th>\n",
+       "      <td>Potassium Phosphate</td>\n",
+       "      <td>Potassium Phosphate</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Nutrition - Supplements</td>\n",
+       "      <td>mmol</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>818</th>\n",
+       "      <td>Lactic Acid(0.5-2.0)</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Chemistry</td>\n",
+       "      <td></td>\n",
+       "      <td>91.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220955</th>\n",
+       "      <td>Ringers Lactate</td>\n",
+       "      <td>Ringers Lactate</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>86.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2638</th>\n",
+       "      <td>CEREBRAL LACTATE</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1634</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30021</th>\n",
+       "      <td>Lactated Ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1520</th>\n",
+       "      <td>ACT</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Coags</td>\n",
+       "      <td></td>\n",
+       "      <td>83.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220507</th>\n",
+       "      <td>Activated Clotting Time</td>\n",
+       "      <td>ACT</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>None</td>\n",
+       "      <td>83.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1671</th>\n",
+       "      <td>act</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>83.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221319</th>\n",
+       "      <td>Alteplase (TPA)</td>\n",
+       "      <td>Alteplase (TPA)</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221347</th>\n",
+       "      <td>Amiodarone</td>\n",
+       "      <td>Amiodarone</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221342</th>\n",
+       "      <td>Aminophylline</td>\n",
+       "      <td>Aminophylline</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                          label         abbreviation         linksto  \\\n",
+       "itemid                                                                 \n",
+       "1531                Lactic Acid                          chartevents   \n",
+       "225668              Lactic Acid          Lactic Acid     chartevents   \n",
+       "50813                   LACTATE                  NaN       labevents   \n",
+       "220228               Hemoglobin           Hemoglobin     chartevents   \n",
+       "2773                  sjlactate                          chartevents   \n",
+       "225835                  Na Phos              Na Phos  inputevents_mv   \n",
+       "225834                   K Phos               K Phos  inputevents_mv   \n",
+       "227526                  Citrate              Citrate  inputevents_mv   \n",
+       "225925      Potassium Phosphate  Potassium Phosphate  inputevents_mv   \n",
+       "818        Lactic Acid(0.5-2.0)                          chartevents   \n",
+       "220955          Ringers Lactate      Ringers Lactate  inputevents_mv   \n",
+       "2638           CEREBRAL LACTATE                          chartevents   \n",
+       "1634           lactated ringers                          chartevents   \n",
+       "30021          Lactated Ringers                       inputevents_cv   \n",
+       "1520                        ACT                          chartevents   \n",
+       "220507  Activated Clotting Time                  ACT     chartevents   \n",
+       "1671                        act                          chartevents   \n",
+       "221319          Alteplase (TPA)      Alteplase (TPA)  inputevents_mv   \n",
+       "221347               Amiodarone           Amiodarone  inputevents_mv   \n",
+       "221342            Aminophylline        Aminophylline  inputevents_mv   \n",
+       "\n",
+       "                           category unitname       score  \n",
+       "itemid                                                    \n",
+       "1531                      Chemistry           110.000000  \n",
+       "225668                         Labs     None  110.000000  \n",
+       "50813                     BLOOD GAS      NaN  110.000000  \n",
+       "220228                         Labs     g/dl  102.666667  \n",
+       "2773                                          102.000000  \n",
+       "225835                  Medications     mmol   96.666667  \n",
+       "225834                  Medications     mmol   96.666667  \n",
+       "227526                  Medications     mmol   96.666667  \n",
+       "225925      Nutrition - Supplements     mmol   96.666667  \n",
+       "818                       Chemistry            91.333333  \n",
+       "220955  Fluids - Other (Not In Use)       mL   86.000000  \n",
+       "2638                                           84.000000  \n",
+       "1634                                           84.000000  \n",
+       "30021                                          84.000000  \n",
+       "1520                          Coags            83.333333  \n",
+       "220507                         Labs     None   83.333333  \n",
+       "1671                                           83.333333  \n",
+       "221319                  Medications       mg   81.333333  \n",
+       "221347                  Medications       mg   81.333333  \n",
+       "221342                  Medications       mg   81.333333  "
+      ]
+     },
+     "execution_count": 105,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Candidate items for lactate: query by name variants plus the unit strings\n",
+    "# 'mmol/L' and 'mg/dL', then show the first 20 rows of the result.\n",
+    "out_df = explorer.search(['lactate', 'lactic acid', 'mmol/L', 'mg/dL'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 106,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for lactate, chosen from the search results shown above.\n",
+    "# Labels/tables are copied from that output.\n",
+    "keep_dict[data_dict.labels.LACTATE] = [\n",
+    "    1531,    # Lactic Acid (chartevents, Chemistry)\n",
+    "    50813,   # LACTATE (labevents, BLOOD GAS)\n",
+    "    225668,  # Lactic Acid (chartevents, Labs)\n",
+    "    818,     # Lactic Acid(0.5-2.0) (chartevents, Chemistry)\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Hemoglobin"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 107,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>51222</th>\n",
+       "      <td>HEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220228</th>\n",
+       "      <td>Hemoglobin</td>\n",
+       "      <td>Hemoglobin</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>g/dl</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>814</th>\n",
+       "      <td>Hemoglobin</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Hematology</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1165</th>\n",
+       "      <td>Hgb</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50811</th>\n",
+       "      <td>HEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51225</th>\n",
+       "      <td>HEMOGLOBIN F</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>104.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51224</th>\n",
+       "      <td>HEMOGLOBIN C</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>104.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50814</th>\n",
+       "      <td>METHEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51223</th>\n",
+       "      <td>HEMOGLOBIN A2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7965</th>\n",
+       "      <td>methhemoglobin</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50852</th>\n",
+       "      <td>% HEMOGLOBIN A1C</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51212</th>\n",
+       "      <td>FETAL HEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50805</th>\n",
+       "      <td>CARBOXYHEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>92.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50855</th>\n",
+       "      <td>ABSOLUTE HEMOGLOBIN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51226</th>\n",
+       "      <td>HEMOGLOBLIN A</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51227</th>\n",
+       "      <td>HEMOGLOBLIN S</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42232</th>\n",
+       "      <td>THYMOGLOBLIN</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45486</th>\n",
+       "      <td>Hemo</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42117</th>\n",
+       "      <td>THYMOGLOBULIN</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>78.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50934</th>\n",
+       "      <td>H</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>76.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                      label abbreviation         linksto          category  \\\n",
+       "itemid                                                                       \n",
+       "51222            HEMOGLOBIN          NaN       labevents        HEMATOLOGY   \n",
+       "220228           Hemoglobin   Hemoglobin     chartevents              Labs   \n",
+       "814              Hemoglobin                  chartevents        Hematology   \n",
+       "1165                    Hgb                  chartevents                     \n",
+       "50811            HEMOGLOBIN          NaN       labevents         BLOOD GAS   \n",
+       "51225          HEMOGLOBIN F          NaN       labevents        HEMATOLOGY   \n",
+       "51224          HEMOGLOBIN C          NaN       labevents        HEMATOLOGY   \n",
+       "50814         METHEMOGLOBIN          NaN       labevents         BLOOD GAS   \n",
+       "51223         HEMOGLOBIN A2          NaN       labevents        HEMATOLOGY   \n",
+       "7965         methhemoglobin                  chartevents                     \n",
+       "50852      % HEMOGLOBIN A1C          NaN       labevents         CHEMISTRY   \n",
+       "51212      FETAL HEMOGLOBIN          NaN       labevents        HEMATOLOGY   \n",
+       "50805     CARBOXYHEMOGLOBIN          NaN       labevents         BLOOD GAS   \n",
+       "50855   ABSOLUTE HEMOGLOBIN          NaN       labevents         CHEMISTRY   \n",
+       "51226         HEMOGLOBLIN A          NaN       labevents        HEMATOLOGY   \n",
+       "51227         HEMOGLOBLIN S          NaN       labevents        HEMATOLOGY   \n",
+       "42232          THYMOGLOBLIN               inputevents_cv  Free Form Intake   \n",
+       "45486                  Hemo               inputevents_cv                     \n",
+       "42117         THYMOGLOBULIN               inputevents_cv  Free Form Intake   \n",
+       "50934                     H          NaN       labevents         CHEMISTRY   \n",
+       "\n",
+       "       unitname       score  \n",
+       "itemid                       \n",
+       "51222       NaN  110.000000  \n",
+       "220228     g/dl  110.000000  \n",
+       "814              110.000000  \n",
+       "1165             110.000000  \n",
+       "50811       NaN  110.000000  \n",
+       "51225       NaN  104.000000  \n",
+       "51224       NaN  104.000000  \n",
+       "50814       NaN  101.333333  \n",
+       "51223       NaN  101.333333  \n",
+       "7965              98.666667  \n",
+       "50852       NaN   96.666667  \n",
+       "51212       NaN   94.666667  \n",
+       "50805       NaN   92.666667  \n",
+       "50855       NaN   89.333333  \n",
+       "51226       NaN   88.000000  \n",
+       "51227       NaN   88.000000  \n",
+       "42232             81.333333  \n",
+       "45486             81.333333  \n",
+       "42117             78.666667  \n",
+       "50934       NaN   76.666667  "
+      ]
+     },
+     "execution_count": 107,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Candidate items for hemoglobin: query by abbreviation, full name and the\n",
+    "# unit string 'g/dL', then show the first 20 rows of the result.\n",
+    "out_df = explorer.search(['hgb', 'hemoglobin', 'g/dL'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 108,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for hemoglobin, chosen from the search results shown above.\n",
+    "# Variant rows in that output (HEMOGLOBIN F/C/A2, METHEMOGLOBIN, ...) are not listed here.\n",
+    "keep_dict[data_dict.labels.HEMOGLOBIN] = [\n",
+    "    51222,   # HEMOGLOBIN (labevents, HEMATOLOGY)\n",
+    "    220228,  # Hemoglobin (chartevents, Labs)\n",
+    "    814,     # Hemoglobin (chartevents, Hematology)\n",
+    "    1165,    # Hgb (chartevents)\n",
+    "    50811,   # HEMOGLOBIN (labevents, BLOOD GAS)\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Fluids\n",
+    "\n",
+    "### Normal Saline"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 109,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>41913</th>\n",
+       "      <td>NS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6190</th>\n",
+       "      <td>Normal saline</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30143</th>\n",
+       "      <td>3% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>104.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30168</th>\n",
+       "      <td>Normal Saline_GU</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30160</th>\n",
+       "      <td>D5 Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30161</th>\n",
+       "      <td>.3% normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30018</th>\n",
+       "      <td>.9% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30020</th>\n",
+       "      <td>.45% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30176</th>\n",
+       "      <td>.25% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30352</th>\n",
+       "      <td>0.9% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220962</th>\n",
+       "      <td>Saline 3%</td>\n",
+       "      <td>Saline 3%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>98.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30353</th>\n",
+       "      <td>0.45% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44440</th>\n",
+       "      <td>Normal Saline Bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44053</th>\n",
+       "      <td>normal saline bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4647</th>\n",
+       "      <td>normal saline bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43354</th>\n",
+       "      <td>normal saline flushs</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>96.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221213</th>\n",
+       "      <td>Saline 30%</td>\n",
+       "      <td>Saline 30%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>95.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220959</th>\n",
+       "      <td>Saline 0,3%</td>\n",
+       "      <td>Saline 0,3%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>92.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220954</th>\n",
+       "      <td>Saline 0,9%</td>\n",
+       "      <td>Saline 0,9%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>92.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220960</th>\n",
+       "      <td>Saline 0,45%</td>\n",
+       "      <td>Saline 0,45%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                       label  abbreviation         linksto  \\\n",
+       "itemid                                                       \n",
+       "41913                     NS                inputevents_cv   \n",
+       "6190           Normal saline                   chartevents   \n",
+       "30143       3% Normal Saline                inputevents_cv   \n",
+       "30168       Normal Saline_GU                inputevents_cv   \n",
+       "30160       D5 Normal Saline                inputevents_cv   \n",
+       "30161      .3% normal Saline                inputevents_cv   \n",
+       "30018      .9% Normal Saline                inputevents_cv   \n",
+       "30020     .45% Normal Saline                inputevents_cv   \n",
+       "30176     .25% Normal Saline                inputevents_cv   \n",
+       "30352     0.9% Normal Saline                inputevents_cv   \n",
+       "220962             Saline 3%     Saline 3%  inputevents_mv   \n",
+       "30353    0.45% Normal Saline                inputevents_cv   \n",
+       "44440    Normal Saline Bolus                inputevents_cv   \n",
+       "44053    normal saline bolus                inputevents_cv   \n",
+       "4647     normal saline bolus                   chartevents   \n",
+       "43354   normal saline flushs                inputevents_cv   \n",
+       "221213            Saline 30%    Saline 30%  inputevents_mv   \n",
+       "220959           Saline 0,3%   Saline 0,3%  inputevents_mv   \n",
+       "220954           Saline 0,9%   Saline 0,9%  inputevents_mv   \n",
+       "220960          Saline 0,45%  Saline 0,45%  inputevents_mv   \n",
+       "\n",
+       "                           category unitname       score  \n",
+       "itemid                                                    \n",
+       "41913              Free Form Intake           110.000000  \n",
+       "6190                                          110.000000  \n",
+       "30143                                         104.333333  \n",
+       "30168                                         103.333333  \n",
+       "30160                                         103.333333  \n",
+       "30161                                         103.333333  \n",
+       "30018                                         103.333333  \n",
+       "30020                                         101.333333  \n",
+       "30176                                         101.333333  \n",
+       "30352                                         100.333333  \n",
+       "220962  Fluids - Other (Not In Use)       mL   98.666667  \n",
+       "30353                                          98.333333  \n",
+       "44440              Free Form Intake            97.333333  \n",
+       "44053              Free Form Intake            97.333333  \n",
+       "4647                                           97.333333  \n",
+       "43354              Free Form Intake            96.000000  \n",
+       "221213  Fluids - Other (Not In Use)       mL   95.000000  \n",
+       "220959  Fluids - Other (Not In Use)       mL   92.000000  \n",
+       "220954  Fluids - Other (Not In Use)       mL   92.000000  \n",
+       "220960  Fluids - Other (Not In Use)       mL   89.333333  "
+      ]
+     },
+     "execution_count": 109,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Candidate items for normal saline: query by name, the 'NS' abbreviation\n",
+    "# and the '0.9%' concentration string, then show the first 20 rows of the result.\n",
+    "out_df = explorer.search(['saline', 'NS', '0.9%', 'normal saline'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 110,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for normal saline, chosen from the search results shown above:\n",
+    "# the 0.9% entries and the unqualified 'NS' / 'Normal saline' / bolus entries.\n",
+    "# Other concentrations in that output (3%, .45%, .3%, .25%, 30%, D5) are not listed here.\n",
+    "# Fix: 20018 -> 30018 and 30252 -> 30352; the previous ids were typos that do not\n",
+    "# appear in the search output, so both 0.9% inputevents_cv items were being missed.\n",
+    "keep_dict[data_dict.labels.NORMAL_SALINE] = [\n",
+    "    41913,   # NS (inputevents_cv, Free Form Intake)\n",
+    "    6190,    # Normal saline (chartevents)\n",
+    "    30018,   # .9% Normal Saline (inputevents_cv)\n",
+    "    30352,   # 0.9% Normal Saline (inputevents_cv)\n",
+    "    44440,   # Normal Saline Bolus (inputevents_cv, Free Form Intake)\n",
+    "    44053,   # normal saline bolus (inputevents_cv, Free Form Intake)\n",
+    "    4647,    # normal saline bolus (chartevents)\n",
+    "    220954,  # Saline 0,9% (inputevents_mv)\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 111,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>41913</th>\n",
+       "      <td>NS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6190</th>\n",
+       "      <td>Normal saline</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30143</th>\n",
+       "      <td>3% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>104.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30168</th>\n",
+       "      <td>Normal Saline_GU</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30160</th>\n",
+       "      <td>D5 Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30161</th>\n",
+       "      <td>.3% normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30018</th>\n",
+       "      <td>.9% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>103.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30020</th>\n",
+       "      <td>.45% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30176</th>\n",
+       "      <td>.25% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>101.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30352</th>\n",
+       "      <td>0.9% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>100.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220962</th>\n",
+       "      <td>Saline 3%</td>\n",
+       "      <td>Saline 3%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>98.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30353</th>\n",
+       "      <td>0.45% Normal Saline</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44440</th>\n",
+       "      <td>Normal Saline Bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44053</th>\n",
+       "      <td>normal saline bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4647</th>\n",
+       "      <td>normal saline bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>43354</th>\n",
+       "      <td>normal saline flushs</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>96.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221213</th>\n",
+       "      <td>Saline 30%</td>\n",
+       "      <td>Saline 30%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>95.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220959</th>\n",
+       "      <td>Saline 0,3%</td>\n",
+       "      <td>Saline 0,3%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>92.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220954</th>\n",
+       "      <td>Saline 0,9%</td>\n",
+       "      <td>Saline 0,9%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>92.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220960</th>\n",
+       "      <td>Saline 0,45%</td>\n",
+       "      <td>Saline 0,45%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220961</th>\n",
+       "      <td>Saline 0,65%</td>\n",
+       "      <td>Saline 0,65%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221212</th>\n",
+       "      <td>Saline 0,18%</td>\n",
+       "      <td>Saline 0,18%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>89.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>41392</th>\n",
+       "      <td>ns b</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225825</th>\n",
+       "      <td>D5NS</td>\n",
+       "      <td>D5NS</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5333</th>\n",
+       "      <td>saline flush</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30060</th>\n",
+       "      <td>D5NS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>226401</th>\n",
+       "      <td>GU Irrigant - Normal Saline</td>\n",
+       "      <td>GU Irrigant - Normal Saline</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>87.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220958</th>\n",
+       "      <td>Saline 0,255%</td>\n",
+       "      <td>Saline 0,255%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>86.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2619</th>\n",
+       "      <td>3% NS</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>227344</th>\n",
+       "      <td>IV/Saline lock</td>\n",
+       "      <td>IV/Saline lock</td>\n",
+       "      <td></td>\n",
+       "      <td>Restraint/Support Systems</td>\n",
+       "      <td></td>\n",
+       "      <td>83.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30190</th>\n",
+       "      <td>NS .9%</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>82.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225158</th>\n",
+       "      <td>NaCl 0.9%</td>\n",
+       "      <td>NaCl 0.9%</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>82.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45298</th>\n",
+       "      <td>ED NS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2072</th>\n",
+       "      <td>Pinsp</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2107</th>\n",
+       "      <td>pinsp</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7092</th>\n",
+       "      <td>Tinsp</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6384</th>\n",
+       "      <td>PINSP</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44498</th>\n",
+       "      <td>er ns</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3204</th>\n",
+       "      <td>Pinsp.</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2404</th>\n",
+       "      <td>.45%ns</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>79.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                              label                 abbreviation  \\\n",
+       "itemid                                                             \n",
+       "41913                            NS                                \n",
+       "6190                  Normal saline                                \n",
+       "30143              3% Normal Saline                                \n",
+       "30168              Normal Saline_GU                                \n",
+       "30160              D5 Normal Saline                                \n",
+       "30161             .3% normal Saline                                \n",
+       "30018             .9% Normal Saline                                \n",
+       "30020            .45% Normal Saline                                \n",
+       "30176            .25% Normal Saline                                \n",
+       "30352            0.9% Normal Saline                                \n",
+       "220962                    Saline 3%                    Saline 3%   \n",
+       "30353           0.45% Normal Saline                                \n",
+       "44440           Normal Saline Bolus                                \n",
+       "44053           normal saline bolus                                \n",
+       "4647            normal saline bolus                                \n",
+       "43354          normal saline flushs                                \n",
+       "221213                   Saline 30%                   Saline 30%   \n",
+       "220959                  Saline 0,3%                  Saline 0,3%   \n",
+       "220954                  Saline 0,9%                  Saline 0,9%   \n",
+       "220960                 Saline 0,45%                 Saline 0,45%   \n",
+       "220961                 Saline 0,65%                 Saline 0,65%   \n",
+       "221212                 Saline 0,18%                 Saline 0,18%   \n",
+       "41392                          ns b                                \n",
+       "225825                         D5NS                         D5NS   \n",
+       "5333                   saline flush                                \n",
+       "30060                          D5NS                                \n",
+       "226401  GU Irrigant - Normal Saline  GU Irrigant - Normal Saline   \n",
+       "220958                Saline 0,255%                Saline 0,255%   \n",
+       "2619                          3% NS                                \n",
+       "227344               IV/Saline lock               IV/Saline lock   \n",
+       "30190                        NS .9%                                \n",
+       "225158                    NaCl 0.9%                    NaCl 0.9%   \n",
+       "45298                         ED NS                                \n",
+       "2072                          Pinsp                                \n",
+       "2107                          pinsp                                \n",
+       "7092                          Tinsp                                \n",
+       "6384                          PINSP                                \n",
+       "44498                         er ns                                \n",
+       "3204                         Pinsp.                                \n",
+       "2404                         .45%ns                                \n",
+       "\n",
+       "               linksto                     category unitname       score  \n",
+       "itemid                                                                    \n",
+       "41913   inputevents_cv             Free Form Intake           110.000000  \n",
+       "6190       chartevents                                        110.000000  \n",
+       "30143   inputevents_cv                                        104.333333  \n",
+       "30168   inputevents_cv                                        103.333333  \n",
+       "30160   inputevents_cv                                        103.333333  \n",
+       "30161   inputevents_cv                                        103.333333  \n",
+       "30018   inputevents_cv                                        103.333333  \n",
+       "30020   inputevents_cv                                        101.333333  \n",
+       "30176   inputevents_cv                                        101.333333  \n",
+       "30352   inputevents_cv                                        100.333333  \n",
+       "220962  inputevents_mv  Fluids - Other (Not In Use)       mL   98.666667  \n",
+       "30353   inputevents_cv                                         98.333333  \n",
+       "44440   inputevents_cv             Free Form Intake            97.333333  \n",
+       "44053   inputevents_cv             Free Form Intake            97.333333  \n",
+       "4647       chartevents                                         97.333333  \n",
+       "43354   inputevents_cv             Free Form Intake            96.000000  \n",
+       "221213  inputevents_mv  Fluids - Other (Not In Use)       mL   95.000000  \n",
+       "220959  inputevents_mv  Fluids - Other (Not In Use)       mL   92.000000  \n",
+       "220954  inputevents_mv  Fluids - Other (Not In Use)       mL   92.000000  \n",
+       "220960  inputevents_mv  Fluids - Other (Not In Use)       mL   89.333333  \n",
+       "220961  inputevents_mv  Fluids - Other (Not In Use)       mL   89.333333  \n",
+       "221212  inputevents_mv  Fluids - Other (Not In Use)       mL   89.333333  \n",
+       "41392   inputevents_cv             Free Form Intake            88.000000  \n",
+       "225825  inputevents_mv                Fluids/Intake       mL   88.000000  \n",
+       "5333       chartevents                                         88.000000  \n",
+       "30060   inputevents_cv                                         88.000000  \n",
+       "226401  inputevents_mv                Fluids/Intake       mL   87.666667  \n",
+       "220958  inputevents_mv  Fluids - Other (Not In Use)       mL   86.666667  \n",
+       "2619       chartevents                                         84.666667  \n",
+       "227344                    Restraint/Support Systems            83.333333  \n",
+       "30190   inputevents_cv                                         82.333333  \n",
+       "225158  inputevents_mv                Fluids/Intake       mL   82.333333  \n",
+       "45298   inputevents_cv             Free Form Intake            81.333333  \n",
+       "2072       chartevents                                         81.333333  \n",
+       "2107       chartevents                                         81.333333  \n",
+       "7092       chartevents                                         81.333333  \n",
+       "6384       chartevents                                         81.333333  \n",
+       "44498   inputevents_cv             Free Form Intake            81.333333  \n",
+       "3204       chartevents                                         79.000000  \n",
+       "2404       chartevents                                         79.000000  "
+      ]
+     },
+     "execution_count": 111,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.head(40)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 112,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "keep_dict[data_dict.labels.NORMAL_SALINE] += [_id for _id in (30190, 225158) if _id not in keep_dict[data_dict.labels.NORMAL_SALINE]]  # add only itemids not already kept, so re-running this cell creates no duplicates"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Lactated Ringers"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 113,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>225828</th>\n",
+       "      <td>LR</td>\n",
+       "      <td>LR</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44367</th>\n",
+       "      <td>LR</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2971</th>\n",
+       "      <td>LR</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1634</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30021</th>\n",
+       "      <td>Lactated Ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45532</th>\n",
+       "      <td>IR Lactated ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>104.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225943</th>\n",
+       "      <td>Solution</td>\n",
+       "      <td>Solution</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225827</th>\n",
+       "      <td>D5LR</td>\n",
+       "      <td>D5LR</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50813</th>\n",
+       "      <td>LACTATE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220953</th>\n",
+       "      <td>Ringers</td>\n",
+       "      <td>Ringers</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46207</th>\n",
+       "      <td>OR LR</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44184</th>\n",
+       "      <td>LR Bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44521</th>\n",
+       "      <td>LR bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46781</th>\n",
+       "      <td>lr bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44815</th>\n",
+       "      <td>LR BOLUS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44915</th>\n",
+       "      <td>D5LR 40K</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46538</th>\n",
+       "      <td>PD solution in</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>68.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44837</th>\n",
+       "      <td>ED URINE</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8313</th>\n",
+       "      <td>Nystatin solution</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30125</th>\n",
+       "      <td>Milrinone</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                      label abbreviation         linksto  \\\n",
+       "itemid                                                     \n",
+       "225828                   LR           LR  inputevents_mv   \n",
+       "44367                    LR               inputevents_cv   \n",
+       "2971                     LR                  chartevents   \n",
+       "1634       lactated ringers                  chartevents   \n",
+       "30021      Lactated Ringers               inputevents_cv   \n",
+       "45532   IR Lactated ringers               inputevents_cv   \n",
+       "225943             Solution     Solution  inputevents_mv   \n",
+       "225827                 D5LR         D5LR  inputevents_mv   \n",
+       "50813               LACTATE          NaN       labevents   \n",
+       "220953              Ringers      Ringers  inputevents_mv   \n",
+       "46207                 OR LR               inputevents_cv   \n",
+       "44184              LR Bolus               inputevents_cv   \n",
+       "44521              LR bolus               inputevents_cv   \n",
+       "46781              lr bolus               inputevents_cv   \n",
+       "44815              LR BOLUS               inputevents_cv   \n",
+       "44915              D5LR 40K               inputevents_cv   \n",
+       "46538        PD solution in               inputevents_cv   \n",
+       "44837              ED URINE                 outputevents   \n",
+       "8313      Nystatin solution                  chartevents   \n",
+       "30125             Milrinone               inputevents_cv   \n",
+       "\n",
+       "                           category unitname       score  \n",
+       "itemid                                                    \n",
+       "225828                Fluids/Intake       mL  110.000000  \n",
+       "44367              Free Form Intake           110.000000  \n",
+       "2971                                          110.000000  \n",
+       "1634                                          110.000000  \n",
+       "30021                                         110.000000  \n",
+       "45532              Free Form Intake           104.000000  \n",
+       "225943                Fluids/Intake       mL   88.000000  \n",
+       "225827                Fluids/Intake       mL   88.000000  \n",
+       "50813                     BLOOD GAS      NaN   84.000000  \n",
+       "220953  Fluids - Other (Not In Use)       mL   84.000000  \n",
+       "46207              Free Form Intake            81.333333  \n",
+       "44184              Free Form Intake            70.000000  \n",
+       "44521              Free Form Intake            70.000000  \n",
+       "46781              Free Form Intake            70.000000  \n",
+       "44815              Free Form Intake            70.000000  \n",
+       "44915              Free Form Intake            70.000000  \n",
+       "46538              Free Form Intake            68.333333  \n",
+       "44837                                          68.000000  \n",
+       "8313                                           67.666667  \n",
+       "30125                                          67.333333  "
+      ]
+     },
+     "execution_count": 113,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up Lactated Ringers candidates by abbreviation and by full name.\n",
+    "out_df = explorer.search(\n",
+    "    ['LR', 'ringers solution', 'lactated ringers']\n",
+    ")\n",
+    "# Show the first 20 rows of the search result.\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 114,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>225828</th>\n",
+       "      <td>LR</td>\n",
+       "      <td>LR</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44367</th>\n",
+       "      <td>LR</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2971</th>\n",
+       "      <td>LR</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1634</th>\n",
+       "      <td>lactated ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30021</th>\n",
+       "      <td>Lactated Ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45532</th>\n",
+       "      <td>IR Lactated ringers</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>104.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225943</th>\n",
+       "      <td>Solution</td>\n",
+       "      <td>Solution</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225827</th>\n",
+       "      <td>D5LR</td>\n",
+       "      <td>D5LR</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids/Intake</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>88.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50813</th>\n",
+       "      <td>LACTATE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220953</th>\n",
+       "      <td>Ringers</td>\n",
+       "      <td>Ringers</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>84.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46207</th>\n",
+       "      <td>OR LR</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>81.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44184</th>\n",
+       "      <td>LR Bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44521</th>\n",
+       "      <td>LR bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46781</th>\n",
+       "      <td>lr bolus</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44815</th>\n",
+       "      <td>LR BOLUS</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44915</th>\n",
+       "      <td>D5LR 40K</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46538</th>\n",
+       "      <td>PD solution in</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>68.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44837</th>\n",
+       "      <td>ED URINE</td>\n",
+       "      <td></td>\n",
+       "      <td>outputevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8313</th>\n",
+       "      <td>Nystatin solution</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30125</th>\n",
+       "      <td>Milrinone</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221986</th>\n",
+       "      <td>Milrinone</td>\n",
+       "      <td>Milrinone</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>67.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30159</th>\n",
+       "      <td>D5 Ringers Lact.</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>67.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228159</th>\n",
+       "      <td>Purge Solution Flow Rate</td>\n",
+       "      <td>Purge Solution Flow Rate</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Impella</td>\n",
+       "      <td>ml/hr</td>\n",
+       "      <td>66.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225953</th>\n",
+       "      <td>Solution (Peritoneal Dialysis)</td>\n",
+       "      <td>Solution (PD)</td>\n",
+       "      <td></td>\n",
+       "      <td>Dialysis</td>\n",
+       "      <td></td>\n",
+       "      <td>66.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45983</th>\n",
+       "      <td>Pitocin/LR</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>65.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42409</th>\n",
+       "      <td>D5LR W/40K</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>65.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42978</th>\n",
+       "      <td>D5LR 20KCL</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>65.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1189</th>\n",
+       "      <td>finger stick</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>65.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5743</th>\n",
+       "      <td>NT suction</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1520</th>\n",
+       "      <td>ACT</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Coags</td>\n",
+       "      <td></td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220507</th>\n",
+       "      <td>Activated Clotting Time</td>\n",
+       "      <td>ACT</td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td>Labs</td>\n",
+       "      <td>None</td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1671</th>\n",
+       "      <td>act</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>64.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8339</th>\n",
+       "      <td>Neo Opium Solution</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>64.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42288</th>\n",
+       "      <td>LR w/40 kcl</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>64.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225072</th>\n",
+       "      <td>Living situation</td>\n",
+       "      <td>Living situation</td>\n",
+       "      <td></td>\n",
+       "      <td>Adm History/FHPA</td>\n",
+       "      <td></td>\n",
+       "      <td>63.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42345</th>\n",
+       "      <td>LR w/ 40 mEq</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2773</th>\n",
+       "      <td>sjlactate</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5088</th>\n",
+       "      <td>fingers</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42265</th>\n",
+       "      <td>LR W/ 20 KCL</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>63.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>220955</th>\n",
+       "      <td>Ringers Lactate</td>\n",
+       "      <td>Ringers Lactate</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Fluids - Other (Not In Use)</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>63.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                 label              abbreviation  \\\n",
+       "itemid                                                             \n",
+       "225828                              LR                        LR   \n",
+       "44367                               LR                             \n",
+       "2971                                LR                             \n",
+       "1634                  lactated ringers                             \n",
+       "30021                 Lactated Ringers                             \n",
+       "45532              IR Lactated ringers                             \n",
+       "225943                        Solution                  Solution   \n",
+       "225827                            D5LR                      D5LR   \n",
+       "50813                          LACTATE                       NaN   \n",
+       "220953                         Ringers                   Ringers   \n",
+       "46207                            OR LR                             \n",
+       "44184                         LR Bolus                             \n",
+       "44521                         LR bolus                             \n",
+       "46781                         lr bolus                             \n",
+       "44815                         LR BOLUS                             \n",
+       "44915                         D5LR 40K                             \n",
+       "46538                   PD solution in                             \n",
+       "44837                         ED URINE                             \n",
+       "8313                 Nystatin solution                             \n",
+       "30125                        Milrinone                             \n",
+       "221986                       Milrinone                 Milrinone   \n",
+       "30159                 D5 Ringers Lact.                             \n",
+       "228159        Purge Solution Flow Rate  Purge Solution Flow Rate   \n",
+       "225953  Solution (Peritoneal Dialysis)             Solution (PD)   \n",
+       "45983                       Pitocin/LR                             \n",
+       "42409                       D5LR W/40K                             \n",
+       "42978                       D5LR 20KCL                             \n",
+       "1189                      finger stick                             \n",
+       "5743                        NT suction                             \n",
+       "1520                               ACT                             \n",
+       "220507         Activated Clotting Time                       ACT   \n",
+       "1671                               act                             \n",
+       "8339                Neo Opium Solution                             \n",
+       "42288                      LR w/40 kcl                             \n",
+       "225072                Living situation          Living situation   \n",
+       "42345                     LR w/ 40 mEq                             \n",
+       "2773                         sjlactate                             \n",
+       "5088                           fingers                             \n",
+       "42265                     LR W/ 20 KCL                             \n",
+       "220955                 Ringers Lactate           Ringers Lactate   \n",
+       "\n",
+       "               linksto                     category unitname       score  \n",
+       "itemid                                                                    \n",
+       "225828  inputevents_mv                Fluids/Intake       mL  110.000000  \n",
+       "44367   inputevents_cv             Free Form Intake           110.000000  \n",
+       "2971       chartevents                                        110.000000  \n",
+       "1634       chartevents                                        110.000000  \n",
+       "30021   inputevents_cv                                        110.000000  \n",
+       "45532   inputevents_cv             Free Form Intake           104.000000  \n",
+       "225943  inputevents_mv                Fluids/Intake       mL   88.000000  \n",
+       "225827  inputevents_mv                Fluids/Intake       mL   88.000000  \n",
+       "50813        labevents                    BLOOD GAS      NaN   84.000000  \n",
+       "220953  inputevents_mv  Fluids - Other (Not In Use)       mL   84.000000  \n",
+       "46207   inputevents_cv             Free Form Intake            81.333333  \n",
+       "44184   inputevents_cv             Free Form Intake            70.000000  \n",
+       "44521   inputevents_cv             Free Form Intake            70.000000  \n",
+       "46781   inputevents_cv             Free Form Intake            70.000000  \n",
+       "44815   inputevents_cv             Free Form Intake            70.000000  \n",
+       "44915   inputevents_cv             Free Form Intake            70.000000  \n",
+       "46538   inputevents_cv             Free Form Intake            68.333333  \n",
+       "44837     outputevents                                         68.000000  \n",
+       "8313       chartevents                                         67.666667  \n",
+       "30125   inputevents_cv                                         67.333333  \n",
+       "221986  inputevents_mv                  Medications       mg   67.333333  \n",
+       "30159   inputevents_cv                                         67.333333  \n",
+       "228159     chartevents                      Impella    ml/hr   66.666667  \n",
+       "225953                                     Dialysis            66.000000  \n",
+       "45983   inputevents_cv             Free Form Intake            65.333333  \n",
+       "42409   inputevents_cv             Free Form Intake            65.333333  \n",
+       "42978   inputevents_cv             Free Form Intake            65.333333  \n",
+       "1189       chartevents                                         65.000000  \n",
+       "5743       chartevents                                         64.666667  \n",
+       "1520       chartevents                        Coags            64.666667  \n",
+       "220507     chartevents                         Labs     None   64.666667  \n",
+       "1671       chartevents                                         64.666667  \n",
+       "8339       chartevents                                         64.333333  \n",
+       "42288   inputevents_cv             Free Form Intake            64.000000  \n",
+       "225072                             Adm History/FHPA            63.666667  \n",
+       "42345   inputevents_cv             Free Form Intake            63.333333  \n",
+       "2773       chartevents                                         63.333333  \n",
+       "5088       chartevents                                         63.333333  \n",
+       "42265   inputevents_cv             Free Form Intake            63.333333  \n",
+       "220955  inputevents_mv  Fluids - Other (Not In Use)       mL   63.000000  "
+      ]
+     },
+     "execution_count": 114,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "out_df.head(40)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 115,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for lactated Ringer's; labels/tables are copied from the search results above.\n",
+    "# NOTE(review): 220953 is labelled plain 'Ringers', while 220955 'Ringers Lactate' and\n",
+    "# 45532 'IR Lactated ringers' are left out -- confirm this selection is intentional.\n",
+    "keep_dict[data_dict.labels.LACTATED_RINGERS] = [\n",
+    "    225828,  # LR (inputevents_mv)\n",
+    "    44367,   # LR (inputevents_cv)\n",
+    "    2971,    # LR (chartevents)\n",
+    "    1634,    # lactated ringers (chartevents)\n",
+    "    30021,   # Lactated Ringers (inputevents_cv)\n",
+    "    220953,  # Ringers (inputevents_mv)\n",
+    "    46207,   # OR LR (inputevents_cv)\n",
+    "    44184,   # LR Bolus (inputevents_cv)\n",
+    "    44521,   # LR bolus (inputevents_cv)\n",
+    "    46781,   # lr bolus (inputevents_cv)\n",
+    "    44815,   # LR BOLUS (inputevents_cv)\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Pressors"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Norepinephrine"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 117,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>30047</th>\n",
+       "      <td>Levophed</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221906</th>\n",
+       "      <td>Norepinephrine</td>\n",
+       "      <td>Norepinephrine</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30120</th>\n",
+       "      <td>Levophed-k</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>102.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30044</th>\n",
+       "      <td>Epinephrine</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>102.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>221289</th>\n",
+       "      <td>Epinephrine</td>\n",
+       "      <td>Epinephrine</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>102.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5752</th>\n",
+       "      <td>Epinephrin</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>98.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51201</th>\n",
+       "      <td>EPINEPHERINE</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>88.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30119</th>\n",
+       "      <td>Epinephrine-k</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>84.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30309</th>\n",
+       "      <td>Epinephrine Drip</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>77.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30127</th>\n",
+       "      <td>Neosynephrine</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>72.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>225922</th>\n",
+       "      <td>Nephramine</td>\n",
+       "      <td>Nephramine</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Nutrition - Supplements</td>\n",
+       "      <td>mL</td>\n",
+       "      <td>71.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3112</th>\n",
+       "      <td>epinephrine mcg/min</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>71.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50820</th>\n",
+       "      <td>PH</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51491</th>\n",
+       "      <td>PH</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>HEMATOLOGY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>51094</th>\n",
+       "      <td>PH</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>CHEMISTRY</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50831</th>\n",
+       "      <td>PH</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>labevents</td>\n",
+       "      <td>BLOOD GAS</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45183</th>\n",
+       "      <td>ED</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7459</th>\n",
+       "      <td>Ph</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1673</th>\n",
+       "      <td>PH</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>70.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>30128</th>\n",
+       "      <td>Neosynephrine-k</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>69.666667</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                      label    abbreviation         linksto  \\\n",
+       "itemid                                                        \n",
+       "30047              Levophed                  inputevents_cv   \n",
+       "221906       Norepinephrine  Norepinephrine  inputevents_mv   \n",
+       "30120            Levophed-k                  inputevents_cv   \n",
+       "30044           Epinephrine                  inputevents_cv   \n",
+       "221289          Epinephrine     Epinephrine  inputevents_mv   \n",
+       "5752             Epinephrin                     chartevents   \n",
+       "51201          EPINEPHERINE             NaN       labevents   \n",
+       "30119         Epinephrine-k                  inputevents_cv   \n",
+       "30309      Epinephrine Drip                  inputevents_cv   \n",
+       "30127         Neosynephrine                  inputevents_cv   \n",
+       "225922           Nephramine      Nephramine  inputevents_mv   \n",
+       "3112    epinephrine mcg/min                     chartevents   \n",
+       "50820                    PH             NaN       labevents   \n",
+       "51491                    PH             NaN       labevents   \n",
+       "51094                    PH             NaN       labevents   \n",
+       "50831                    PH             NaN       labevents   \n",
+       "45183                    ED                  inputevents_cv   \n",
+       "7459                     Ph                     chartevents   \n",
+       "1673                     PH                     chartevents   \n",
+       "30128       Neosynephrine-k                  inputevents_cv   \n",
+       "\n",
+       "                       category unitname       score  \n",
+       "itemid                                                \n",
+       "30047                                     110.000000  \n",
+       "221906              Medications       mg  110.000000  \n",
+       "30120                                     102.666667  \n",
+       "30044                                     102.000000  \n",
+       "221289              Medications       mg  102.000000  \n",
+       "5752                                       98.666667  \n",
+       "51201                HEMATOLOGY      NaN   88.666667  \n",
+       "30119                                      84.666667  \n",
+       "30309                                      77.333333  \n",
+       "30127                                      72.333333  \n",
+       "225922  Nutrition - Supplements       mL   71.333333  \n",
+       "3112                                       71.000000  \n",
+       "50820                 BLOOD GAS      NaN   70.000000  \n",
+       "51491                HEMATOLOGY      NaN   70.000000  \n",
+       "51094                 CHEMISTRY      NaN   70.000000  \n",
+       "50831                 BLOOD GAS      NaN   70.000000  \n",
+       "45183          Free Form Intake            70.000000  \n",
+       "7459                                       70.000000  \n",
+       "1673                                       70.000000  \n",
+       "30128                                      69.666667  "
+      ]
+     },
+     "execution_count": 117,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Look up candidate items for norepinephrine under both names it is searched by here.\n",
+    "out_df = explorer.search(['levophed', 'norepinephrine'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 118,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Item ids kept for norepinephrine; labels/tables are copied from the search results above.\n",
+    "keep_dict[data_dict.labels.NOREPINEPHRINE] = [\n",
+    "    30047,   # Levophed (inputevents_cv)\n",
+    "    221906,  # Norepinephrine (inputevents_mv)\n",
+    "    30120,   # Levophed-k (inputevents_cv)\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Vasopressin"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 119,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>abbreviation</th>\n",
+       "      <th>linksto</th>\n",
+       "      <th>category</th>\n",
+       "      <th>unitname</th>\n",
+       "      <th>score</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>itemid</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>30051</th>\n",
+       "      <td>Vasopressin</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2445</th>\n",
+       "      <td>Vasopressin</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>222315</th>\n",
+       "      <td>Vasopressin</td>\n",
+       "      <td>Vasopressin</td>\n",
+       "      <td>inputevents_mv</td>\n",
+       "      <td>Medications</td>\n",
+       "      <td>units</td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1136</th>\n",
+       "      <td>vasopressin</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1222</th>\n",
+       "      <td>VASOPRESSIN</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>110.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2334</th>\n",
+       "      <td>vasopressin u/hr</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2561</th>\n",
+       "      <td>VASOPRESSIN U/HR</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>97.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7341</th>\n",
+       "      <td>Vasopressin  u/hr</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>96.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46570</th>\n",
+       "      <td>vassopressin</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>94.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42802</th>\n",
+       "      <td>VASOPRESSIN  CC/HR.</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>94.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6255</th>\n",
+       "      <td>VAsopressin 0.04   s</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>92.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2765</th>\n",
+       "      <td>VASOPRESSIN   UNIT/R</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>92.333333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2248</th>\n",
+       "      <td>VASOPRESSIN UNIT/MIN</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>42273</th>\n",
+       "      <td>vasopressin unit/min</td>\n",
+       "      <td></td>\n",
+       "      <td>inputevents_cv</td>\n",
+       "      <td>Free Form Intake</td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1327</th>\n",
+       "      <td>vasopressin unit/min</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>90.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6269</th>\n",
+       "      <td>Dressing</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>46</th>\n",
+       "      <td>Angio Dressing #2</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6691</th>\n",
+       "      <td>DRIV PRESS</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>45</th>\n",
+       "      <td>Angio Dressing #1</td>\n",
+       "      <td></td>\n",
+       "      <td>chartevents</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>68.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>228448</th>\n",
+       "      <td>Angio Dressing # 4</td>\n",
+       "      <td>Angio Dressing # 4</td>\n",
+       "      <td></td>\n",
+       "      <td>Cardiovascular</td>\n",
+       "      <td></td>\n",
+       "      <td>67.333333</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                       label        abbreviation         linksto  \\\n",
+       "itemid                                                             \n",
+       "30051            Vasopressin                      inputevents_cv   \n",
+       "2445             Vasopressin                         chartevents   \n",
+       "222315           Vasopressin         Vasopressin  inputevents_mv   \n",
+       "1136             vasopressin                         chartevents   \n",
+       "1222             VASOPRESSIN                         chartevents   \n",
+       "2334        vasopressin u/hr                         chartevents   \n",
+       "2561        VASOPRESSIN U/HR                         chartevents   \n",
+       "7341       Vasopressin  u/hr                         chartevents   \n",
+       "46570           vassopressin                      inputevents_cv   \n",
+       "42802    VASOPRESSIN  CC/HR.                      inputevents_cv   \n",
+       "6255    VAsopressin 0.04   s                         chartevents   \n",
+       "2765    VASOPRESSIN   UNIT/R                         chartevents   \n",
+       "2248    VASOPRESSIN UNIT/MIN                         chartevents   \n",
+       "42273   vasopressin unit/min                      inputevents_cv   \n",
+       "1327    vasopressin unit/min                         chartevents   \n",
+       "6269                Dressing                         chartevents   \n",
+       "46         Angio Dressing #2                         chartevents   \n",
+       "6691              DRIV PRESS                         chartevents   \n",
+       "45         Angio Dressing #1                         chartevents   \n",
+       "228448    Angio Dressing # 4  Angio Dressing # 4                   \n",
+       "\n",
+       "                category unitname       score  \n",
+       "itemid                                         \n",
+       "30051                              110.000000  \n",
+       "2445                               110.000000  \n",
+       "222315       Medications    units  110.000000  \n",
+       "1136                               110.000000  \n",
+       "1222                               110.000000  \n",
+       "2334                                97.333333  \n",
+       "2561                                97.333333  \n",
+       "7341                                96.666667  \n",
+       "46570   Free Form Intake            94.333333  \n",
+       "42802   Free Form Intake            94.000000  \n",
+       "6255                                92.333333  \n",
+       "2765                                92.333333  \n",
+       "2248                                90.666667  \n",
+       "42273   Free Form Intake            90.666667  \n",
+       "1327                                90.666667  \n",
+       "6269                                68.666667  \n",
+       "46                                  68.000000  \n",
+       "6691                                68.000000  \n",
+       "45                                  68.000000  \n",
+       "228448    Cardiovascular            67.333333  "
+      ]
+     },
+     "execution_count": 119,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Search for vasopressin under its common synonyms and preview the first 20 rows of the result.\n",
+    "out_df = explorer.search(['vasopressin', 'argipressin', 'arginine vasopressin'])\n",
+    "out_df.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 120,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Keep every hit from the top of the search results through itemid 1327.\n",
+    "# .loc slices by index label (not position) and includes the end label.\n",
+    "keep_dict[data_dict.labels.VASOPRESSIN] = (\n",
+    "    out_df.loc[:1327]\n",
+    "    .index\n",
+    "    .tolist()\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Now build our mapping dataframe"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 124,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import pandas as pd\n",
+    "from itertools import product"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 131,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "# One (label, itemid) row for every item kept under each label.\n",
+    "# dict.items() is used instead of the Python-2-only iteritems() so the cell\n",
+    "# runs unchanged on Python 2 and Python 3; row order still follows keep_dict.\n",
+    "tuples = [(label, itemid) for label, items in keep_dict.items() for itemid in items]\n",
+    "\n",
+    "item_map = pd.DataFrame(tuples, columns=['label', 'itemid'])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 132,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>glasgow coma scale eye opening</td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>glasgow coma scale eye opening</td>\n",
+       "      <td>220739</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>glasgow coma scale motor</td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>glasgow coma scale motor</td>\n",
+       "      <td>223901</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>blood pressure systolic</td>\n",
+       "      <td>220179</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                            label  itemid\n",
+       "0  glasgow coma scale eye opening     184\n",
+       "1  glasgow coma scale eye opening  220739\n",
+       "2        glasgow coma scale motor     454\n",
+       "3        glasgow coma scale motor  223901\n",
+       "4         blood pressure systolic  220179"
+      ]
+     },
+     "execution_count": 132,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Preview the first rows of the label-to-itemid mapping.\n",
+    "item_map.head(5)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 133,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Persist the mapping; the extraction section reads this same path back as item_map_fname.\n",
+    "item_map.to_csv('config/mimic_item_map.csv', index=False)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Extract MIMIC III data"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import pandas as pd\n",
+    "import mimic\n",
+    "from constants import ALL\n",
+    "import icu_data_defs \n",
+    "import utils\n",
+    "import logger\n",
+    "import warnings\n",
+    "warnings.filterwarnings('ignore')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Pick up local edits to the project modules without restarting the kernel.\n",
+    "reload(icu_data_defs)\n",
+    "reload(mimic)\n",
+    "reload(logger)\n",
+    "\n",
+    "def extract_labels(conn,labels,item_map_fname,hdf5_fname,hadm_ids=ALL):\n",
+    "    \"\"\"Extract each label with mimic.mimic_extractor and save the result.\n",
+    "\n",
+    "    For every label, the frame returned by extractor.extract_label is saved\n",
+    "    with utils.save_df under the key 'extract/LABEL', then its head and shape\n",
+    "    are displayed. Labels for which the extractor returns None are skipped.\n",
+    "\n",
+    "    conn           -- connection handed to mimic.mimic_extractor\n",
+    "    labels         -- list of label strings to extract\n",
+    "    item_map_fname -- item map file handed to mimic.mimic_extractor\n",
+    "    hdf5_fname     -- destination passed to utils.save_df\n",
+    "    hadm_ids       -- forwarded to extract_label (default ALL);\n",
+    "                      presumably hospital admission ids -- TODO confirm\n",
+    "\n",
+    "    Returns None.\n",
+    "    \"\"\"\n",
+    "    logger.log('Start extracting {} labels'.format(len(labels)),new_level=True)\n",
+    "    extractor = mimic.mimic_extractor(conn,item_map_fname)\n",
+    "    for label in labels:\n",
+    "        logger.log(label.upper(),new_level=True)\n",
+    "        df = extractor.extract_label(label,hadm_ids)\n",
+    "        if df is None: continue\n",
+    "        utils.save_df(df,hdf5_fname,'extract/{}'.format(label))\n",
+    "        display(df.head())\n",
+    "        # Parenthesised form prints the same text on Python 2 and is valid on Python 3.\n",
+    "        print(df.shape)\n",
+    "        # Release the frame before the next extraction; full runs return millions of rows.\n",
+    "        del df\n",
+    "    logger.end_log()\n",
+    "\n",
+    "#connect to the mimic database\n",
+    "conn = mimic.connect()\n",
+    "\n",
+    "#these are the default config files we will be using\n",
+    "item_map_fname = 'config/mimic_item_map.csv'\n",
+    "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n",
+    "\n",
+    "#get all labels\n",
+    "SIMPLE_DATA_PANEL_ID = 12 #12 is \"simple data\"\n",
+    "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n",
+    "simple_data = data_dict.get_panel_defintions(SIMPLE_DATA_PANEL_ID)\n",
+    "labels = simple_data.label.unique().tolist()\n",
+    "\n",
+    "#where we will be storing this extraction\n",
+    "hdf5_fname = 'data/mimic_data'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 03:26:58) Start extracting 5 labels\n",
+      "(2017-06-03 03:26:58)>> HEART RATE\n",
+      "(2017-06-03 03:26:59)>>>> Extracting 5 items from chartevents\n",
+      "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:26:59)>>>> Combine DF\n",
+      "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:26:59)>>>> Clean UOM\n",
+      "(2017-06-03 03:26:59)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:00:00</td>\n",
+       "      <td>62</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:30:00</td>\n",
+       "      <td>67</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 01:00:00</td>\n",
+       "      <td>67</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 01:20:00</td>\n",
+       "      <td>63</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 01:25:00</td>\n",
+       "      <td>63</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value     units  itemid\n",
+       "0  143838 2129-07-14 00:00:00    62  beat/min     211\n",
+       "1  143838 2129-07-14 00:30:00    67  beat/min     211\n",
+       "2  143838 2129-07-14 01:00:00    67  beat/min     211\n",
+       "3  143838 2129-07-14 01:20:00    63  beat/min     211\n",
+       "4  143838 2129-07-14 01:25:00    63  beat/min     211"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1649, 5)\n",
+      "(2017-06-03 03:27:01)<< DONE (3.0s)\n",
+      "(2017-06-03 03:27:01)>> BLOOD PRESSURE SYSTOLIC\n",
+      "(2017-06-03 03:27:01)>>>> Extracting 14 items from chartevents\n",
+      "(2017-06-03 03:27:02)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:27:02)>>>> Combine DF\n",
+      "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:02)>>>> Clean UOM\n",
+      "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-13 22:40:00</td>\n",
+       "      <td>145</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-13 23:00:00</td>\n",
+       "      <td>136</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-13 23:30:00</td>\n",
+       "      <td>179</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:00:00</td>\n",
+       "      <td>131</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:30:00</td>\n",
+       "      <td>146</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value units  itemid\n",
+       "0  143838 2129-07-13 22:40:00   145  mmHg      51\n",
+       "1  143838 2129-07-13 23:00:00   136  mmHg      51\n",
+       "2  143838 2129-07-13 23:30:00   179  mmHg      51\n",
+       "3  143838 2129-07-14 00:00:00   131  mmHg      51\n",
+       "4  143838 2129-07-14 00:30:00   146  mmHg      51"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(644, 5)\n",
+      "(2017-06-03 03:27:02)<< DONE (1.0s)\n",
+      "(2017-06-03 03:27:02)>> BLOOD PRESSURE DIASTOLIC\n",
+      "(2017-06-03 03:27:02)>>>> Extracting 15 items from chartevents\n",
+      "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:02)>>>> Combine DF\n",
+      "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:02)>>>> Clean UOM\n",
+      "(2017-06-03 03:27:02)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 21:00:00</td>\n",
+       "      <td>53</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 14:00:00</td>\n",
+       "      <td>84</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 10:30:00</td>\n",
+       "      <td>54</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 15:00:00</td>\n",
+       "      <td>60</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 16:00:00</td>\n",
+       "      <td>59</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value units  itemid\n",
+       "0  113540 2161-10-12 21:00:00    53  mmHg  220051\n",
+       "1  113540 2161-10-12 14:00:00    84  mmHg  220051\n",
+       "2  113540 2161-10-12 10:30:00    54  mmHg  220051\n",
+       "3  113540 2161-10-12 15:00:00    60  mmHg  220051\n",
+       "4  113540 2161-10-12 16:00:00    59  mmHg  220051"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(640, 5)\n",
+      "(2017-06-03 03:27:02)<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:02)>> BLOOD PRESSURE MEAN\n",
+      "(2017-06-03 03:27:03)>>>> Extracting 3 items from chartevents\n",
+      "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:03)>>>> Combine DF\n",
+      "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:03)>>>> Clean UOM\n",
+      "(2017-06-03 03:27:03)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 21:00:00</td>\n",
+       "      <td>76</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 12:00:00</td>\n",
+       "      <td>91</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 14:00:00</td>\n",
+       "      <td>82</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 10:30:00</td>\n",
+       "      <td>70</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>113540</td>\n",
+       "      <td>2161-10-12 15:00:00</td>\n",
+       "      <td>80</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value units  itemid\n",
+       "0  113540 2161-10-12 21:00:00    76  mmHg  220052\n",
+       "1  113540 2161-10-12 12:00:00    91  mmHg  220052\n",
+       "2  113540 2161-10-12 14:00:00    82  mmHg  220052\n",
+       "3  113540 2161-10-12 10:30:00    70  mmHg  220052\n",
+       "4  113540 2161-10-12 15:00:00    80  mmHg  220052"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(58, 5)\n",
+      "(2017-06-03 03:27:03)<< DONE (1.0s)\n",
+      "(2017-06-03 03:27:03)>> RESPIRATORY RATE\n",
+      "(2017-06-03 03:27:03)>>>> Extracting 4 items from chartevents\n",
+      "(2017-06-03 03:27:04)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:27:04)>>>> Combine DF\n",
+      "(2017-06-03 03:27:04)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:27:04)>>>> Clean UOM\n",
+      "(2017-06-03 03:27:04)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-13 23:30:00</td>\n",
+       "      <td>17</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:00:00</td>\n",
+       "      <td>20</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 00:30:00</td>\n",
+       "      <td>17</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 01:00:00</td>\n",
+       "      <td>13</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>143838</td>\n",
+       "      <td>2129-07-14 01:20:00</td>\n",
+       "      <td>15</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value       units  itemid\n",
+       "0  143838 2129-07-13 23:30:00    17  breath/min     618\n",
+       "1  143838 2129-07-14 00:00:00    20  breath/min     618\n",
+       "2  143838 2129-07-14 00:30:00    17  breath/min     618\n",
+       "3  143838 2129-07-14 01:00:00    13  breath/min     618\n",
+       "4  143838 2129-07-14 01:20:00    15  breath/min     618"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1647, 5)\n",
+      "(2017-06-03 03:27:04)<< DONE (1.0s)\n",
+      "(2017-06-03 03:27:04) DONE (6.0s)\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Smoke test: extract only the first 5 labels, restricted to the sampled hadm_ids.\n",
+    "hadm_ids = mimic.sample_hadm_ids(5,conn)\n",
+    "extract_labels(conn,labels[:5],item_map_fname,hdf5_fname,hadm_ids)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 03:27:10) Start extracting 18 labels\n",
+      "(2017-06-03 03:27:10)>> HEART RATE\n",
+      "(2017-06-03 03:27:10)>>>> Extracting 5 items from chartevents\n",
+      "(2017-06-03 03:28:03)<<<< DONE (53.0s)\n",
+      "(2017-06-03 03:28:03)>>>> Combine DF\n",
+      "(2017-06-03 03:28:03)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:28:03)>>>> Clean UOM\n",
+      "(2017-06-03 03:28:07)<<<< DONE (4.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-26 03:00:00</td>\n",
+       "      <td>79</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-02 06:00:00</td>\n",
+       "      <td>116</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-02 07:00:00</td>\n",
+       "      <td>116</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-02 08:00:00</td>\n",
+       "      <td>144</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-03 08:00:00</td>\n",
+       "      <td>144</td>\n",
+       "      <td>beat/min</td>\n",
+       "      <td>211</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value     units  itemid\n",
+       "0  185910.0 2166-08-26 03:00:00    79  beat/min     211\n",
+       "1  106266.0 2114-12-02 06:00:00   116  beat/min     211\n",
+       "2  106266.0 2114-12-02 07:00:00   116  beat/min     211\n",
+       "3  106266.0 2114-12-02 08:00:00   144  beat/min     211\n",
+       "4  106266.0 2114-12-03 08:00:00   144  beat/min     211"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(7952939, 5)\n",
+      "(2017-06-03 03:28:20)<< DONE (70.0s)\n",
+      "(2017-06-03 03:28:20)>> BLOOD PRESSURE SYSTOLIC\n",
+      "(2017-06-03 03:28:21)>>>> Extracting 14 items from chartevents\n",
+      "(2017-06-03 03:29:45)<<<< DONE (84.0s)\n",
+      "(2017-06-03 03:29:45)>>>> Combine DF\n",
+      "(2017-06-03 03:29:45)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:29:45)>>>> Clean UOM\n",
+      "(2017-06-03 03:29:48)<<<< DONE (3.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>176203.0</td>\n",
+       "      <td>2154-11-12 22:00:00</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>197569.0</td>\n",
+       "      <td>2133-03-09 00:00:00</td>\n",
+       "      <td>117</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>197569.0</td>\n",
+       "      <td>2133-03-09 01:00:00</td>\n",
+       "      <td>117</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>197569.0</td>\n",
+       "      <td>2133-03-09 02:00:00</td>\n",
+       "      <td>127</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>197569.0</td>\n",
+       "      <td>2133-03-09 03:00:00</td>\n",
+       "      <td>126</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value units  itemid\n",
+       "0  176203.0 2154-11-12 22:00:00                  51\n",
+       "1  197569.0 2133-03-09 00:00:00   117  mmHg      51\n",
+       "2  197569.0 2133-03-09 01:00:00   117  mmHg      51\n",
+       "3  197569.0 2133-03-09 02:00:00   127  mmHg      51\n",
+       "4  197569.0 2133-03-09 03:00:00   126  mmHg      51"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(6374824, 5)\n",
+      "(2017-06-03 03:30:00)<< DONE (100.0s)\n",
+      "(2017-06-03 03:30:00)>> BLOOD PRESSURE DIASTOLIC\n",
+      "(2017-06-03 03:30:00)>>>> Extracting 15 items from chartevents\n",
+      "(2017-06-03 03:31:18)<<<< DONE (78.0s)\n",
+      "(2017-06-03 03:31:18)>>>> Combine DF\n",
+      "(2017-06-03 03:31:19)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:31:19)>>>> Clean UOM\n",
+      "(2017-06-03 03:31:22)<<<< DONE (3.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>124321.0</td>\n",
+       "      <td>2157-10-21 12:15:00</td>\n",
+       "      <td>74</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>124321.0</td>\n",
+       "      <td>2157-10-21 13:00:00</td>\n",
+       "      <td>67</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>124321.0</td>\n",
+       "      <td>2157-10-21 14:00:00</td>\n",
+       "      <td>64</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>124321.0</td>\n",
+       "      <td>2157-10-21 15:00:00</td>\n",
+       "      <td>76</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>124321.0</td>\n",
+       "      <td>2157-10-21 16:17:00</td>\n",
+       "      <td>80</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220051</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value units  itemid\n",
+       "0  124321.0 2157-10-21 12:15:00    74  mmHg  220051\n",
+       "1  124321.0 2157-10-21 13:00:00    67  mmHg  220051\n",
+       "2  124321.0 2157-10-21 14:00:00    64  mmHg  220051\n",
+       "3  124321.0 2157-10-21 15:00:00    76  mmHg  220051\n",
+       "4  124321.0 2157-10-21 16:17:00    80  mmHg  220051"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(6371249, 5)\n",
+      "(2017-06-03 03:31:34)<< DONE (94.0s)\n",
+      "(2017-06-03 03:31:34)>> BLOOD PRESSURE MEAN\n",
+      "(2017-06-03 03:31:34)>>>> Extracting 3 items from chartevents\n",
+      "(2017-06-03 03:32:13)<<<< DONE (39.0s)\n",
+      "(2017-06-03 03:32:13)>>>> Combine DF\n",
+      "(2017-06-03 03:32:13)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:32:13)>>>> Clean UOM\n",
+      "(2017-06-03 03:32:14)<<<< DONE (1.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>124321</td>\n",
+       "      <td>2157-10-21 13:00:00</td>\n",
+       "      <td>86</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>124321</td>\n",
+       "      <td>2157-10-21 14:00:00</td>\n",
+       "      <td>86</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>124321</td>\n",
+       "      <td>2157-10-21 15:00:00</td>\n",
+       "      <td>98</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>124321</td>\n",
+       "      <td>2157-10-21 16:17:00</td>\n",
+       "      <td>104</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>124321</td>\n",
+       "      <td>2157-10-21 17:00:00</td>\n",
+       "      <td>104</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>220052</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value units  itemid\n",
+       "0  124321 2157-10-21 13:00:00    86  mmHg  220052\n",
+       "1  124321 2157-10-21 14:00:00    86  mmHg  220052\n",
+       "2  124321 2157-10-21 15:00:00    98  mmHg  220052\n",
+       "3  124321 2157-10-21 16:17:00   104  mmHg  220052\n",
+       "4  124321 2157-10-21 17:00:00   104  mmHg  220052"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2536271, 5)\n",
+      "(2017-06-03 03:32:18)<< DONE (44.0s)\n",
+      "(2017-06-03 03:32:18)>> RESPIRATORY RATE\n",
+      "(2017-06-03 03:32:18)>>>> Extracting 4 items from chartevents\n",
+      "(2017-06-03 03:34:08)<<<< DONE (110.0s)\n",
+      "(2017-06-03 03:34:08)>>>> Combine DF\n",
+      "(2017-06-03 03:34:08)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:34:08)>>>> Clean UOM\n",
+      "(2017-06-03 03:34:13)<<<< DONE (5.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>20</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>122659.0</td>\n",
+       "      <td>2131-05-22 14:00:00</td>\n",
+       "      <td>29</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 19:00:00</td>\n",
+       "      <td>24</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>24</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-10 13:30:00</td>\n",
+       "      <td>22</td>\n",
+       "      <td>breath/min</td>\n",
+       "      <td>618</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value       units  itemid\n",
+       "0  185910.0 2166-08-25 00:00:00    20  breath/min     618\n",
+       "1  122659.0 2131-05-22 14:00:00    29  breath/min     618\n",
+       "2  188670.0 2183-08-23 19:00:00    24  breath/min     618\n",
+       "3  188670.0 2183-08-23 20:00:00    24  breath/min     618\n",
+       "4  185910.0 2166-08-10 13:30:00    22  breath/min     618"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(7810019, 5)\n",
+      "(2017-06-03 03:34:27)<< DONE (129.0s)\n",
+      "(2017-06-03 03:34:27)>> TEMPERATURE BODY\n",
+      "(2017-06-03 03:34:27)>>>> Extracting 4 items from chartevents\n",
+      "(2017-06-03 03:35:01)<<<< DONE (34.0s)\n",
+      "(2017-06-03 03:35:01)>>>> Combine DF\n",
+      "(2017-06-03 03:35:01)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:35:01)>>>> Clean UOM\n",
+      "(2017-06-03 03:35:02)<<<< DONE (1.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>98.400001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>99.300003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-12 08:00:00</td>\n",
+       "      <td>98.699996948242188</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-13 17:00:00</td>\n",
+       "      <td>99.900001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-11 20:00:00</td>\n",
+       "      <td>37.900001525878906</td>\n",
+       "      <td>degC</td>\n",
+       "      <td>676</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime               value units  itemid\n",
+       "0  185910.0 2166-08-25 00:00:00  98.400001525878906  degF     678\n",
+       "1  188670.0 2183-08-23 20:00:00  99.300003051757812  degF     678\n",
+       "2  185910.0 2166-08-12 08:00:00  98.699996948242188  degF     678\n",
+       "3  185910.0 2166-08-13 17:00:00  99.900001525878906  degF     678\n",
+       "4  166707.0 2122-02-11 20:00:00  37.900001525878906  degC     676"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1751447, 5)\n",
+      "(2017-06-03 03:35:05)<< DONE (38.0s)\n",
+      "(2017-06-03 03:35:05)>> OXYGEN SATURATION PULSE OXIMETRY\n",
+      "(2017-06-03 03:35:06)>>>> Extracting 2 items from chartevents\n",
+      "(2017-06-03 03:35:59)<<<< DONE (53.0s)\n",
+      "(2017-06-03 03:35:59)>>>> Combine DF\n",
+      "(2017-06-03 03:35:59)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:35:59)>>>> Clean UOM\n",
+      "(2017-06-03 03:36:02)<<<< DONE (3.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>646</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:15:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>646</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>122659.0</td>\n",
+       "      <td>2131-05-22 14:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>646</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 19:00:00</td>\n",
+       "      <td>97</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>646</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>97</td>\n",
+       "      <td>percent</td>\n",
+       "      <td>646</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value    units  itemid\n",
+       "0  185910.0 2166-08-25 00:00:00   100  percent     646\n",
+       "1  185910.0 2166-08-25 00:15:00   100  percent     646\n",
+       "2  122659.0 2131-05-22 14:00:00   100  percent     646\n",
+       "3  188670.0 2183-08-23 19:00:00    97  percent     646\n",
+       "4  188670.0 2183-08-23 20:00:00    97  percent     646"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(6099827, 5)\n",
+      "(2017-06-03 03:36:14)<< DONE (69.0s)\n",
+      "(2017-06-03 03:36:14)>> WEIGHT BODY\n",
+      "(2017-06-03 03:36:14)>>>> Extracting 3 items from chartevents\n",
+      "(2017-06-03 03:36:48)<<<< DONE (34.0s)\n",
+      "(2017-06-03 03:36:48)>>>> Combine DF\n",
+      "(2017-06-03 03:36:49)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:36:49)>>>> Clean UOM\n",
+      "(2017-06-03 03:36:49)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-20 06:00:00</td>\n",
+       "      <td>102.5</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>763</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-15 07:00:00</td>\n",
+       "      <td>99.400001525878906</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>763</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>182104.0</td>\n",
+       "      <td>2131-05-05 06:00:00</td>\n",
+       "      <td>109.69999694824219</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>763</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>157907.0</td>\n",
+       "      <td>2129-06-10 05:00:00</td>\n",
+       "      <td>103.19999694824219</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>763</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-14 06:00:00</td>\n",
+       "      <td>101.80000305175781</td>\n",
+       "      <td>kg</td>\n",
+       "      <td>763</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime               value units  itemid\n",
+       "0  185910.0 2166-08-20 06:00:00               102.5    kg     763\n",
+       "1  166707.0 2122-02-15 07:00:00  99.400001525878906    kg     763\n",
+       "2  182104.0 2131-05-05 06:00:00  109.69999694824219    kg     763\n",
+       "3  157907.0 2129-06-10 05:00:00  103.19999694824219    kg     763\n",
+       "4  166707.0 2122-02-14 06:00:00  101.80000305175781    kg     763"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(95425, 5)\n",
+      "(2017-06-03 03:36:49)<< DONE (35.0s)\n",
+      "(2017-06-03 03:36:49)>> OUTPUT URINE\n",
+      "(2017-06-03 03:36:49)>>>> Extracting 2 items from chartevents\n",
+      "(2017-06-03 03:37:28)<<<< DONE (39.0s)\n",
+      "(2017-06-03 03:37:28)>>>> Extracting 29 items from outputevents\n",
+      "(2017-06-03 03:37:59)<<<< DONE (31.0s)\n",
+      "(2017-06-03 03:37:59)>>>> Combine DF\n",
+      "(2017-06-03 03:37:59)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:37:59)>>>> Clean UOM\n",
+      "(2017-06-03 03:38:09)<<<< DONE (10.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-03 08:00:00</td>\n",
+       "      <td>Voiding qs</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>3686</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-09 09:00:00</td>\n",
+       "      <td>Voiding qs</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>3686</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-09 14:00:00</td>\n",
+       "      <td>Voiding qs</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>3686</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-05 21:30:00</td>\n",
+       "      <td>Voiding qs</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>3686</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>106266.0</td>\n",
+       "      <td>2114-12-04 16:00:00</td>\n",
+       "      <td>Voiding qs</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>3686</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime       value units  itemid\n",
+       "0  106266.0 2114-12-03 08:00:00  Voiding qs    ml    3686\n",
+       "1  106266.0 2114-12-09 09:00:00  Voiding qs    ml    3686\n",
+       "2  106266.0 2114-12-09 14:00:00  Voiding qs    ml    3686\n",
+       "3  106266.0 2114-12-05 21:30:00  Voiding qs    ml    3686\n",
+       "4  106266.0 2114-12-04 16:00:00  Voiding qs    ml    3686"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(3644639, 5)\n",
+      "(2017-06-03 03:38:15)<< DONE (86.0s)\n",
+      "(2017-06-03 03:38:15)>> GLASGOW COMA SCALE MOTOR\n",
+      "(2017-06-03 03:38:15)>>>> Extracting 1 items from chartevents\n",
+      "(2017-06-03 03:39:12)<<<< DONE (57.0s)\n",
+      "(2017-06-03 03:39:12)>>>> Combine DF\n",
+      "(2017-06-03 03:39:12)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:39:12)>>>> Clean UOM\n",
+      "(2017-06-03 03:39:12)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>6 Obeys Commands</td>\n",
+       "      <td></td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>6 Obeys Commands</td>\n",
+       "      <td></td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-27 12:00:00</td>\n",
+       "      <td>5 Localizes Pain</td>\n",
+       "      <td></td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-09-03 12:00:00</td>\n",
+       "      <td>6 Obeys Commands</td>\n",
+       "      <td></td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>101757.0</td>\n",
+       "      <td>2133-01-03 16:00:00</td>\n",
+       "      <td>6 Obeys Commands</td>\n",
+       "      <td></td>\n",
+       "      <td>454</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime             value units  itemid\n",
+       "0  185910.0 2166-08-25 00:00:00  6 Obeys Commands           454\n",
+       "1  188670.0 2183-08-23 20:00:00  6 Obeys Commands           454\n",
+       "2  185910.0 2166-08-27 12:00:00  5 Localizes Pain           454\n",
+       "3  185910.0 2166-09-03 12:00:00  6 Obeys Commands           454\n",
+       "4  101757.0 2133-01-03 16:00:00  6 Obeys Commands           454"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(952565, 5)\n",
+      "(2017-06-03 03:39:13)<< DONE (58.0s)\n",
+      "(2017-06-03 03:39:13)>> GLASGOW COMA SCALE EYE OPENING\n",
+      "(2017-06-03 03:39:13)>>>> Extracting 1 items from chartevents\n",
+      "(2017-06-03 03:39:57)<<<< DONE (44.0s)\n",
+      "(2017-06-03 03:39:57)>>>> Combine DF\n",
+      "(2017-06-03 03:39:57)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:39:57)>>>> Clean UOM\n",
+      "(2017-06-03 03:39:57)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>4 Spontaneously</td>\n",
+       "      <td></td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-15 20:00:00</td>\n",
+       "      <td>4 Spontaneously</td>\n",
+       "      <td></td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-16 16:00:00</td>\n",
+       "      <td>3 To speech</td>\n",
+       "      <td></td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-23 04:00:00</td>\n",
+       "      <td>3 To speech</td>\n",
+       "      <td></td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-27 12:00:00</td>\n",
+       "      <td>1 No Response</td>\n",
+       "      <td></td>\n",
+       "      <td>184</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime            value units  itemid\n",
+       "0  188670.0 2183-08-23 20:00:00  4 Spontaneously           184\n",
+       "1  185910.0 2166-08-15 20:00:00  4 Spontaneously           184\n",
+       "2  185910.0 2166-08-16 16:00:00      3 To speech           184\n",
+       "3  185910.0 2166-08-23 04:00:00      3 To speech           184\n",
+       "4  185910.0 2166-08-27 12:00:00    1 No Response           184"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(956672, 5)\n",
+      "(2017-06-03 03:39:58)<< DONE (45.0s)\n",
+      "(2017-06-03 03:39:58)>> GLASGOW COMA SCALE VERBAL\n",
+      "(2017-06-03 03:39:59)>>>> Extracting 1 items from chartevents\n",
+      "(2017-06-03 03:40:22)<<<< DONE (23.0s)\n",
+      "(2017-06-03 03:40:22)>>>> Combine DF\n",
+      "(2017-06-03 03:40:22)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:40:22)>>>> Clean UOM\n",
+      "(2017-06-03 03:40:22)<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>1.0 ET/Trach</td>\n",
+       "      <td></td>\n",
+       "      <td>723</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>4 Confused</td>\n",
+       "      <td></td>\n",
+       "      <td>723</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-12 08:00:00</td>\n",
+       "      <td>1.0 ET/Trach</td>\n",
+       "      <td></td>\n",
+       "      <td>723</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-27 12:00:00</td>\n",
+       "      <td>1.0 ET/Trach</td>\n",
+       "      <td></td>\n",
+       "      <td>723</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-11 20:00:00</td>\n",
+       "      <td>5 Oriented</td>\n",
+       "      <td></td>\n",
+       "      <td>723</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime         value units  itemid\n",
+       "0  185910.0 2166-08-25 00:00:00  1.0 ET/Trach           723\n",
+       "1  188670.0 2183-08-23 20:00:00    4 Confused           723\n",
+       "2  185910.0 2166-08-12 08:00:00  1.0 ET/Trach           723\n",
+       "3  185910.0 2166-08-27 12:00:00  1.0 ET/Trach           723\n",
+       "4  166707.0 2122-02-11 20:00:00    5 Oriented           723"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(954700, 5)\n",
+      "(2017-06-03 03:40:24)<< DONE (26.0s)\n",
+      "(2017-06-03 03:40:24)>> NORMAL SALINE\n",
+      "(2017-06-03 03:40:24)>>>> Extracting 2 items from chartevents\n",
+      "(2017-06-03 03:40:24)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:40:24)>>>> Extracting 4 items from inputevents_cv\n",
+      "(2017-06-03 03:40:25)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:40:25)>>>> Extracting 2 items from inputevents_mv\n",
+      "(2017-06-03 03:40:43)<<<< DONE (18.0s)\n",
+      "(2017-06-03 03:40:43)>>>> Combine DF\n",
+      "(2017-06-03 03:40:43)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:40:43)>>>> Clean UOM\n",
+      "(2017-06-03 03:40:46)<<<< DONE (3.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>110468</td>\n",
+       "      <td>2134-02-13 03:45:00</td>\n",
+       "      <td>given</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>4647</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>110468</td>\n",
+       "      <td>2134-02-13 07:05:00</td>\n",
+       "      <td>given</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>4647</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>175419</td>\n",
+       "      <td>2122-08-16 01:00:00</td>\n",
+       "      <td>given</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>4647</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>143494</td>\n",
+       "      <td>2147-07-02 23:00:00</td>\n",
+       "      <td>given</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>4647</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>143494</td>\n",
+       "      <td>2147-07-02 23:43:00</td>\n",
+       "      <td>given</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>4647</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime  value units  itemid\n",
+       "0  110468 2134-02-13 03:45:00  given    ml    4647\n",
+       "1  110468 2134-02-13 07:05:00  given    ml    4647\n",
+       "2  175419 2122-08-16 01:00:00  given    ml    4647\n",
+       "3  143494 2147-07-02 23:00:00  given    ml    4647\n",
+       "4  143494 2147-07-02 23:43:00  given    ml    4647"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(817373, 5)\n",
+      "(2017-06-03 03:40:46)<< DONE (22.0s)\n",
+      "(2017-06-03 03:40:46)>> LACTATED RINGERS\n",
+      "(2017-06-03 03:40:46)>>>> Extracting 2 items from chartevents\n",
+      "(2017-06-03 03:40:46)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:40:46)>>>> Extracting 7 items from inputevents_cv\n",
+      "(2017-06-03 03:40:50)<<<< DONE (4.0s)\n",
+      "(2017-06-03 03:40:50)>>>> Extracting 2 items from inputevents_mv\n",
+      "(2017-06-03 03:40:51)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:40:51)>>>> Combine DF\n",
+      "(2017-06-03 03:40:51)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:40:51)>>>> Clean UOM\n",
+      "(2017-06-03 03:40:53)<<<< DONE (2.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>194762.0</td>\n",
+       "      <td>2110-11-22 18:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>1634</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>178769.0</td>\n",
+       "      <td>2181-06-01 05:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>2971</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>178769.0</td>\n",
+       "      <td>2181-06-01 01:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>2971</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>178769.0</td>\n",
+       "      <td>2181-06-01 02:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>2971</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>178769.0</td>\n",
+       "      <td>2181-06-01 03:00:00</td>\n",
+       "      <td>100</td>\n",
+       "      <td>ml</td>\n",
+       "      <td>2971</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value units  itemid\n",
+       "0  194762.0 2110-11-22 18:00:00   100    ml    1634\n",
+       "1  178769.0 2181-06-01 05:00:00   100    ml    2971\n",
+       "2  178769.0 2181-06-01 01:00:00   100    ml    2971\n",
+       "3  178769.0 2181-06-01 02:00:00   100    ml    2971\n",
+       "4  178769.0 2181-06-01 03:00:00   100    ml    2971"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(504306, 5)\n",
+      "(2017-06-03 03:40:53)<< DONE (7.0s)\n",
+      "(2017-06-03 03:40:53)>> NOREPINEPHRINE\n",
+      "(2017-06-03 03:40:53)>>>> Extracting 2 items from inputevents_cv\n",
+      "(2017-06-03 03:41:10)<<<< DONE (17.0s)\n",
+      "(2017-06-03 03:41:10)>>>> Extracting 1 items from inputevents_mv\n",
+      "(2017-06-03 03:41:12)<<<< DONE (2.0s)\n",
+      "(2017-06-03 03:41:12)>>>> Combine DF\n",
+      "(2017-06-03 03:41:12)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:41:12)>>>> Clean UOM\n",
+      "(2017-06-03 03:41:16)<<<< DONE (4.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>181516.0</td>\n",
+       "      <td>2121-01-27 00:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>30120</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>194502.0</td>\n",
+       "      <td>2102-12-20 08:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>30047</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>172260.0</td>\n",
+       "      <td>2124-11-11 16:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>30047</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>114829.0</td>\n",
+       "      <td>2107-01-15 22:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>30047</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>181516.0</td>\n",
+       "      <td>2121-01-27 01:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>mg</td>\n",
+       "      <td>30120</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime  value units  itemid\n",
+       "0  181516.0 2121-01-27 00:00:00    NaN    mg   30120\n",
+       "1  194502.0 2102-12-20 08:00:00    NaN    mg   30047\n",
+       "2  172260.0 2124-11-11 16:00:00    NaN    mg   30047\n",
+       "3  114829.0 2107-01-15 22:00:00    NaN    mg   30047\n",
+       "4  181516.0 2121-01-27 01:00:00    NaN    mg   30120"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1136938, 5)\n",
+      "(2017-06-03 03:41:16)<< DONE (23.0s)\n",
+      "(2017-06-03 03:41:16)>> VASOPRESSIN\n",
+      "(2017-06-03 03:41:16)>>>> Extracting 10 items from chartevents\n",
+      "(2017-06-03 03:41:17)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:41:17)>>>> Extracting 4 items from inputevents_cv\n",
+      "(2017-06-03 03:41:22)<<<< DONE (5.0s)\n",
+      "(2017-06-03 03:41:22)>>>> Extracting 1 items from inputevents_mv\n",
+      "(2017-06-03 03:41:23)<<<< DONE (1.0s)\n",
+      "(2017-06-03 03:41:23)>>>> Combine DF\n",
+      "(2017-06-03 03:41:23)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:41:23)>>>> Clean UOM\n",
+      "(2017-06-03 03:41:24)<<<< DONE (1.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>126005.0</td>\n",
+       "      <td>2126-09-05 16:30:00</td>\n",
+       "      <td></td>\n",
+       "      <td>U</td>\n",
+       "      <td>1136</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>126005.0</td>\n",
+       "      <td>2126-09-05 16:45:00</td>\n",
+       "      <td></td>\n",
+       "      <td>units/hour</td>\n",
+       "      <td>1136</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>115221.0</td>\n",
+       "      <td>2194-12-09 05:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>U</td>\n",
+       "      <td>1136</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>115221.0</td>\n",
+       "      <td>2194-12-09 06:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>units/hour</td>\n",
+       "      <td>1136</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>115221.0</td>\n",
+       "      <td>2194-12-09 04:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>units/hour</td>\n",
+       "      <td>1136</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value       units  itemid\n",
+       "0  126005.0 2126-09-05 16:30:00                 U    1136\n",
+       "1  126005.0 2126-09-05 16:45:00        units/hour    1136\n",
+       "2  115221.0 2194-12-09 05:00:00     3           U    1136\n",
+       "3  115221.0 2194-12-09 06:00:00     3  units/hour    1136\n",
+       "4  115221.0 2194-12-09 04:00:00     3  units/hour    1136"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(339184, 5)\n",
+      "(2017-06-03 03:41:24)<< DONE (8.0s)\n",
+      "(2017-06-03 03:41:24)>> HEMOGLOBIN\n",
+      "(2017-06-03 03:41:24)>>>> Extracting 3 items from chartevents\n",
+      "(2017-06-03 03:43:00)<<<< DONE (96.0s)\n",
+      "(2017-06-03 03:43:00)>>>> Extracting 2 items from labevents\n",
+      "(2017-06-03 03:43:27)<<<< DONE (27.0s)\n",
+      "(2017-06-03 03:43:27)>>>> Combine DF\n",
+      "(2017-06-03 03:43:27)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:43:27)>>>> Clean UOM\n",
+      "(2017-06-03 03:43:30)<<<< DONE (3.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-13 01:53:00</td>\n",
+       "      <td>9.5</td>\n",
+       "      <td>gm/dl</td>\n",
+       "      <td>814</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-22 02:14:00</td>\n",
+       "      <td>10</td>\n",
+       "      <td>gm/dl</td>\n",
+       "      <td>814</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-18 03:46:00</td>\n",
+       "      <td>10.100000381469727</td>\n",
+       "      <td>gm/dl</td>\n",
+       "      <td>814</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>157907.0</td>\n",
+       "      <td>2129-06-11 02:00:00</td>\n",
+       "      <td>9.8999996185302734</td>\n",
+       "      <td>gm/dl</td>\n",
+       "      <td>814</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-30 02:07:00</td>\n",
+       "      <td>9</td>\n",
+       "      <td>gm/dl</td>\n",
+       "      <td>814</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime               value  units  itemid\n",
+       "0  185910.0 2166-08-13 01:53:00                 9.5  gm/dl     814\n",
+       "1  185910.0 2166-08-22 02:14:00                  10  gm/dl     814\n",
+       "2  185910.0 2166-08-18 03:46:00  10.100000381469727  gm/dl     814\n",
+       "3  157907.0 2129-06-11 02:00:00  9.8999996185302734  gm/dl     814\n",
+       "4  185910.0 2166-08-30 02:07:00                   9  gm/dl     814"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1167921, 5)\n",
+      "(2017-06-03 03:43:31)<< DONE (127.0s)\n",
+      "(2017-06-03 03:43:31)>> LACTATE\n",
+      "(2017-06-03 03:43:31)>>>> Extracting 3 items from chartevents\n",
+      "(2017-06-03 03:44:30)<<<< DONE (59.0s)\n",
+      "(2017-06-03 03:44:30)>>>> Extracting 1 items from labevents\n",
+      "(2017-06-03 03:44:33)<<<< DONE (3.0s)\n",
+      "(2017-06-03 03:44:33)>>>> Combine DF\n",
+      "(2017-06-03 03:44:33)<<<< DONE (0.0s)\n",
+      "(2017-06-03 03:44:33)>>>> Clean UOM\n",
+      "(2017-06-03 03:44:34)<<<< DONE (1.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-11 21:20:00</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>818</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-11 21:20:00</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>1531</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>175413.0</td>\n",
+       "      <td>2170-04-11 15:00:00</td>\n",
+       "      <td></td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>818</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>146828.0</td>\n",
+       "      <td>2186-10-03 21:54:00</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>818</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>146828.0</td>\n",
+       "      <td>2186-10-03 21:54:00</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>1531</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "         id            datetime value   units  itemid\n",
+       "0  185910.0 2166-08-11 21:20:00   1.5  mmol/L     818\n",
+       "1  185910.0 2166-08-11 21:20:00   1.5  mmol/L    1531\n",
+       "2  175413.0 2170-04-11 15:00:00        mmol/L     818\n",
+       "3  146828.0 2186-10-03 21:54:00   1.8  mmol/L     818\n",
+       "4  146828.0 2186-10-03 21:54:00   1.8  mmol/L    1531"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(393608, 5)\n",
+      "(2017-06-03 03:44:35)<< DONE (64.0s)\n",
+      "(2017-06-03 03:44:35) DONE (1045.0s)\n"
+     ]
+    }
+   ],
+   "source": [
+    "df_all = extract_labels(conn,labels,item_map_fname,hdf5_fname)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Transform (and \"Load\") MIMIC III Data"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 152,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import icu_data_defs \n",
+    "import mimic\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import logger\n",
+    "import pandas as pd\n",
+    "from constants import column_names\n",
+    "import utils\n",
+    "import warnings\n",
+    "warnings.filterwarnings('ignore')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 153,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload(utils)\n",
+    "reload(logger)\n",
+    "reload(mimic)\n",
+    "def transform_extracted_labels(labels,hdf5_fname):\n",
+    "    \"\"\"Transform every extracted label and store the result in the HDF5 file.\n",
+    "\n",
+    "    For each label the frame stored under 'extract/<label>' is opened, run\n",
+    "    through the clean -> unstack -> clean_uom pipeline, tagged with a\n",
+    "    'label' level on its column index and saved under 'transformed/<label>'.\n",
+    "\n",
+    "    labels     : iterable of label strings; each is used to build the HDF5 keys\n",
+    "    hdf5_fname : path of the HDF5 file that is both read from and written to\n",
+    "\n",
+    "    Returns None -- the transformed frames are only persisted, not returned.\n",
+    "    \"\"\"\n",
+    "    \n",
+    "    pipeline = Pipeline([\n",
+    "        ('clean',mimic.clean_extract()),\n",
+    "        ('unstack',mimic.unstacker()),\n",
+    "        ('clean_uom',mimic.clean_uom())\n",
+    "    ])\n",
+    "    \n",
+    "    for label in labels:\n",
+    "        logger.log('Opening {}'.format(label.upper()))\n",
+    "        df = utils.open_df(hdf5_fname,'extract/{}'.format(label))\n",
+    "        logger.log('Transforming {} - {}'.format(label.upper(),df.shape))\n",
+    "        df_transformed = pipeline.transform(df)\n",
+    "        # Add label guess to column index of the TRANSFORMED frame.\n",
+    "        # (Previously the level was added to the raw `df`, which is discarded\n",
+    "        # below, so the saved data never carried the label.)\n",
+    "        df_transformed = utils.add_same_val__index_level(df_transformed,label,'label',axis=1)\n",
+    "        display(df_transformed.head())\n",
+    "        utils.save_df(df_transformed,hdf5_fname,'transformed/{}'.format(label))\n",
+    "        # free both frames before loading the next label (extracts are multi-million rows)\n",
+    "        del df,df_transformed\n",
+    "        logger.end_log_level()\n",
+    "        \n",
+    "    return\n",
+    "        \n",
+    "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n",
+    "hdf5_fname = 'data/mimic_data'\n",
+    "\n",
+    "#get all labels\n",
+    "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n",
+    "simple_data = data_dict.get_panel_defintions(12) #12 is \"simple data\"\n",
+    "labels = simple_data.label.unique().tolist()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-02 05:11:14) Opening HEART RATE\n",
+      "(2017-06-02 05:11:19) DONE (5.0s)\n",
+      "(2017-06-02 05:11:19) Transforming HEART RATE - (7952939, 5)\n"
+     ]
+    },
+    {
+     "ename": "KeyboardInterrupt",
+     "evalue": "",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[1;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
+      "\u001b[1;32m<ipython-input-3-4ff30e8e4bcc>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mtransform_extracted_labels\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabels\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
+      "\u001b[1;32m<ipython-input-2-7e9518f41127>\u001b[0m in \u001b[0;36mtransform_extracted_labels\u001b[1;34m(labels, hdf5_fname)\u001b[0m\n\u001b[0;32m     14\u001b[0m         \u001b[0mdf\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mopen_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'extract/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     15\u001b[0m         \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mlog\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'Transforming {} - {}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mupper\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 16\u001b[1;33m         \u001b[0mdf_transformed\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mpipeline\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mtransform\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     17\u001b[0m         \u001b[0mdisplay\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_transformed\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mhead\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     18\u001b[0m         
\u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msave_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_transformed\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'transformed/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mlabel\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\sklearn\\pipeline.pyc\u001b[0m in \u001b[0;36m_transform\u001b[1;34m(self, X)\u001b[0m\n\u001b[0;32m    446\u001b[0m         \u001b[1;32mfor\u001b[0m \u001b[0mname\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mtransform\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msteps\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    447\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[0mtransform\u001b[0m \u001b[1;32mis\u001b[0m \u001b[1;32mnot\u001b[0m \u001b[0mNone\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 448\u001b[1;33m                 \u001b[0mXt\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mtransform\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mtransform\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mXt\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    449\u001b[0m         \u001b[1;32mreturn\u001b[0m \u001b[0mXt\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    450\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.pyc\u001b[0m in \u001b[0;36mtransform\u001b[1;34m(self, df)\u001b[0m\n\u001b[0;32m    189\u001b[0m         \u001b[0mFORMAT\u001b[0m \u001b[0mpre\u001b[0m\u001b[1;33m-\u001b[0m\u001b[0munstack\u001b[0m \u001b[0mcolumns\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    190\u001b[0m         \"\"\"\n\u001b[1;32m--> 191\u001b[1;33m         \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mreplace\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mto_replace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m''\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mpd\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnan\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    192\u001b[0m         \u001b[1;31m#drop NAN record_id, timestamps, or value\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    193\u001b[0m         \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mdropna\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0msubset\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mID\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mDATETIME\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcolumn_names\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mVALUE\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mhow\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m'any'\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\generic.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, limit, regex, method, axis)\u001b[0m\n\u001b[0;32m   3538\u001b[0m                     new_data = self._data.replace(to_replace=to_replace,\n\u001b[0;32m   3539\u001b[0m                                                   \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mvalue\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3540\u001b[1;33m                                                   regex=regex)\n\u001b[0m\u001b[0;32m   3541\u001b[0m                 \u001b[1;32melse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   3542\u001b[0m                     msg = ('Invalid \"to_replace\" type: '\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, **kwargs)\u001b[0m\n\u001b[0;32m   3172\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   3173\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mreplace\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3174\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mapply\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'replace'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   3175\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   3176\u001b[0m     def replace_list(self, src_list, dest_list, inplace=False, regex=False,\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mapply\u001b[1;34m(self, f, axes, filter, do_integrity_check, consolidate, **kwargs)\u001b[0m\n\u001b[0;32m   3033\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   3034\u001b[0m             \u001b[0mkwargs\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'mgr'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 3035\u001b[1;33m             \u001b[0mapplied\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mgetattr\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mb\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mf\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m   3036\u001b[0m             \u001b[0mresult_blocks\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0m_extend_blocks\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mapplied\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mresult_blocks\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   3037\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, filter, regex, convert, mgr)\u001b[0m\n\u001b[0;32m   1926\u001b[0m                                                     \u001b[0minplace\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0minplace\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   1927\u001b[0m                                                     \u001b[0mfilter\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mfilter\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mregex\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mregex\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m-> 1928\u001b[1;33m                                                     convert=convert, mgr=mgr)\n\u001b[0m\u001b[0;32m   1929\u001b[0m         \u001b[1;32melif\u001b[0m \u001b[0mboth_lists\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   1930\u001b[0m             \u001b[1;32mfor\u001b[0m \u001b[0mto_rep\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mv\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mzip\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mto_replace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\internals.pyc\u001b[0m in \u001b[0;36mreplace\u001b[1;34m(self, to_replace, value, inplace, filter, regex, convert, mgr)\u001b[0m\n\u001b[0;32m    623\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    624\u001b[0m         \u001b[0moriginal_to_replace\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mto_replace\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 625\u001b[1;33m         \u001b[0mmask\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0misnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    626\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    627\u001b[0m         \u001b[1;31m# try to replace, if we raise an error, convert to ObjectBlock and\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36misnull\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m     43\u001b[0m     \u001b[0mpandas\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mnotnull\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mboolean\u001b[0m \u001b[0minverse\u001b[0m \u001b[0mof\u001b[0m \u001b[0mpandas\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     44\u001b[0m     \"\"\"\n\u001b[1;32m---> 45\u001b[1;33m     \u001b[1;32mreturn\u001b[0m \u001b[0m_isnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     46\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     47\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36m_isnull_new\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m     53\u001b[0m         \u001b[1;32mraise\u001b[0m \u001b[0mNotImplementedError\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m\"isnull is not defined for MultiIndex\"\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     54\u001b[0m     \u001b[1;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mABCSeries\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mndarray\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mABCIndexClass\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 55\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0m_isnull_ndarraylike\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     56\u001b[0m     \u001b[1;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mABCGeneric\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     57\u001b[0m         \u001b[1;32mreturn\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_constructor\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_data\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mfunc\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0misnull\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\types\\missing.pyc\u001b[0m in \u001b[0;36m_isnull_ndarraylike\u001b[1;34m(obj)\u001b[0m\n\u001b[0;32m    139\u001b[0m                 \u001b[0mresult\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mempty\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mbool\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    140\u001b[0m                 \u001b[0mvec\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mlib\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0misnullobj\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mvalues\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mravel\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 141\u001b[1;33m                 \u001b[0mresult\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m.\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvec\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mreshape\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    142\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    143\u001b[0m     \u001b[1;32melif\u001b[0m \u001b[0mneeds_i8_conversion\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;31mKeyboardInterrupt\u001b[0m: "
+     ]
+    }
+   ],
+   "source": [
+    "transform_extracted_labels(labels,hdf5_fname)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "store = pd.HDFStore(hdf5_fname)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<class 'pandas.io.pytables.HDFStore'>\n",
+       "File path: data/mimic_data\n",
+       "/extract/blood pressure diastolic                        frame        (shape->[6371249,5])\n",
+       "/extract/blood pressure mean                             frame        (shape->[2536271,5])\n",
+       "/extract/blood pressure systolic                         frame        (shape->[6374824,5])\n",
+       "/extract/glasgow coma scale eye opening                  frame        (shape->[956672,5]) \n",
+       "/extract/glasgow coma scale motor                        frame        (shape->[952565,5]) \n",
+       "/extract/glasgow coma scale verbal                       frame        (shape->[954700,5]) \n",
+       "/extract/heart rate                                      frame        (shape->[7952939,5])\n",
+       "/extract/hemoglobin                                      frame        (shape->[1167921,5])\n",
+       "/extract/lactate                                         frame        (shape->[393608,5]) \n",
+       "/extract/lactated ringers                                frame        (shape->[504306,5]) \n",
+       "/extract/norepinephrine                                  frame        (shape->[1136938,5])\n",
+       "/extract/normal saline                                   frame        (shape->[817373,5]) \n",
+       "/extract/output urine                                    frame        (shape->[3644639,5])\n",
+       "/extract/oxygen saturation pulse oximetry                frame        (shape->[6099827,5])\n",
+       "/extract/respiratory rate                                frame        (shape->[7810019,5])\n",
+       "/extract/temperature body                                frame        (shape->[1751447,5])\n",
+       "/extract/vasopressin                                     frame        (shape->[339184,5]) \n",
+       "/extract/weight body                                     frame        (shape->[95425,5])  \n",
+       "/transformed/blood pressure diastolic                    frame                            \n",
+       "/transformed/blood pressure mean                         frame                            \n",
+       "/transformed/blood pressure systolic                     frame                            \n",
+       "/transformed/glasgow coma scale eye opening              frame                            \n",
+       "/transformed/glasgow coma scale motor                    frame                            \n",
+       "/transformed/glasgow coma scale verbal                   frame                            \n",
+       "/transformed/heart rate                                  frame                            \n",
+       "/transformed/hemoglobin                                  frame                            \n",
+       "/transformed/lactate                                     frame                            \n",
+       "/transformed/lactated ringers                            frame                            \n",
+       "/transformed/norepinephrine                              frame                            \n",
+       "/transformed/normal saline                               frame                            \n",
+       "/transformed/output urine                                frame                            \n",
+       "/transformed/oxygen saturation pulse oximetry            frame                            \n",
+       "/transformed/respiratory rate                            frame                            \n",
+       "/transformed/temperature body                            frame                            \n",
+       "/transformed/vasopressin                                 frame                            \n",
+       "/transformed/weight body                                 frame                            "
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "store"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "store.close()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 116,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<module 'utils' from 'utils.py'>"
+      ]
+     },
+     "execution_count": 116,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "reload(utils)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Cleaners"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Design decision: if a given column contains both NUMERIC CATEGORICAL and QUANTITATIVE data, the NUMERIC CATEGORICAL values in that column are treated as QUANTITATIVE data. This is an accepted (if unfortunate) limitation."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import transformers\n",
+    "import utils\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "from units import MedicalUreg\n",
+    "import icu_data_defs\n",
+    "import units\n",
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Re-import the local helper modules so edits to them take effect in this kernel.\n",
+    "reload(transformers)\n",
+    "reload(utils)\n",
+    "\n",
+    "# Input locations for the cleaning workflow.\n",
+    "mimic_data_sef_fname = 'config/data_definitions.xlsx'\n",
+    "hdf5_fname = 'data/mimic_data'\n",
+    "medical_units = 'config/medical_units.txt'\n",
+    "\n",
+    "# Build the data dictionary from the definitions workbook and choose the label to clean.\n",
+    "data_dict = icu_data_defs.data_dictionary(mimic_data_sef_fname)\n",
+    "label = 'lactate'\n",
+    "\n",
+    "# Cleaning steps; a Pipeline applies them in the order listed.\n",
+    "standard_pipeline = Pipeline([\n",
+    "    ('aggregate_same_datetime',\n",
+    "     transformers.same_index_aggregator(agg_func=lambda x: x.iloc[0])),\n",
+    "    ('split_dtype',\n",
+    "     transformers.split_dtype()),\n",
+    "    ('format_columns',\n",
+    "     transformers.format_columns(data_dict, MedicalUreg(medical_units))),\n",
+    "    ('drop_small_columns',\n",
+    "     transformers.remove_small_columns(threshold=50)),\n",
+    "])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "transformers.py:103: SettingWithCopyWarning: \n",
+      "A value is trying to be set on a copy of a slice from a DataFrame\n",
+      "\n",
+      "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy\n",
+      "  df_out.dropna(how='all',inplace=True,axis=1)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "(113L, 0, '0.0%')"
+      ]
+     },
+     "execution_count": 3,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Read the transformed frame for the selected label from the HDF5 store named by\n",
+    "# hdf5_fname (set in the configuration cell) rather than repeating the path literal,\n",
+    "# so the store location is configured in exactly one place.\n",
+    "df = utils.open_df(hdf5_fname,'transformed/{}'.format(label))\n",
+    "\n",
+    "# Run the cleaning pipeline, then report how much data the cleaning removed.\n",
+    "df_cleaned = standard_pipeline.transform(df)\n",
+    "utils.data_loss(df,df_cleaned)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 216,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"6\" halign=\"left\">lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">mmol/L</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>50813</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>50813(mmol/L)</th>\n",
+       "      <th>818</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>100001</th>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100003</th>\n",
+       "      <th>2150-04-17 19:12:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-08 10:58:00</th>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-03-31 00:44:00</th>\n",
+       "      <td>3.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-02 14:10:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100009</th>\n",
+       "      <th>2162-05-17 13:19:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2162-05-17 17:14:00</th>\n",
+       "      <td>1.5</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">100010</th>\n",
+       "      <th>2109-12-10 10:25:00</th>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 12:11:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:05:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:58:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100011</th>\n",
+       "      <th>2177-08-29 04:44:00</th>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-08-29 06:55:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100012</th>\n",
+       "      <th>2177-03-14 07:38:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-14 11:42:00</th>\n",
+       "      <td>2.5</td>\n",
+       "      <td>2.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 08:05:00</th>\n",
+       "      <td>2.1</td>\n",
+       "      <td>2.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 14:01:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 21:42:00</th>\n",
+       "      <td>1.8</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100016</th>\n",
+       "      <th>2188-05-24 12:00:00</th>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100017</th>\n",
+       "      <th>2103-03-11 05:10:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100018</th>\n",
+       "      <th>2176-08-29 15:29:00</th>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 09:23:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 10:19:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 11:29:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 12:40:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100020</th>\n",
+       "      <th>2142-11-30 21:54:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2142-12-03 00:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100024</th>\n",
+       "      <th>2170-09-19 10:25:00</th>\n",
+       "      <td>1.4</td>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-19 16:33:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-20 02:04:00</th>\n",
+       "      <td>3.2</td>\n",
+       "      <td>3.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199976</th>\n",
+       "      <th>2182-02-14 11:15:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-16 03:57:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-19 03:59:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-20 03:31:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-21 04:55:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199979</th>\n",
+       "      <th>2182-02-06 09:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-06 14:16:00</th>\n",
+       "      <td>3.8</td>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">199981</th>\n",
+       "      <th>2110-09-24 16:34:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-24 20:09:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-25 06:10:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>199987</th>\n",
+       "      <th>2175-05-19 16:30:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">199988</th>\n",
+       "      <th>2169-01-24 12:48:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 01:35:00</th>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 11:18:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 16:43:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 22:35:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-10 05:33:00</th>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199993</th>\n",
+       "      <th>2161-11-12 23:14:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-11-13 03:46:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">199994</th>\n",
+       "      <th>2188-07-07 21:23:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 03:09:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 04:13:00</th>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 06:20:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-20 10:52:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 12:36:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:33:00</th>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:59:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 20:43:00</th>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-04 20:55:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 15:29:00</th>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>177451 rows × 6 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      lactate                                        \n",
+       "status                       known         unknown                        \n",
+       "variable_type                   qn              qn                nom     \n",
+       "units                       mmol/L        no_units           no_units     \n",
+       "description                  50813 225668      818 1531 50813(mmol/L)  818\n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:32:00     1.9    NaN      NaN  NaN           NaN  NaN\n",
+       "100003 2150-04-17 19:12:00     1.1    1.1      NaN  NaN           NaN  NaN\n",
+       "100006 2108-04-08 10:58:00     4.5    NaN      4.5  NaN           NaN  NaN\n",
+       "100007 2145-03-31 00:44:00     3.1    NaN      NaN  NaN           NaN  NaN\n",
+       "       2145-04-02 14:10:00     1.9    NaN      NaN  NaN           NaN  NaN\n",
+       "100009 2162-05-17 13:19:00     1.1    1.1      NaN  NaN           NaN  NaN\n",
+       "       2162-05-17 17:14:00     1.5    1.5      NaN  NaN           NaN  NaN\n",
+       "100010 2109-12-10 10:25:00     0.6    NaN      NaN  NaN           NaN  NaN\n",
+       "       2109-12-10 12:11:00     0.9    NaN      NaN  NaN           NaN  NaN\n",
+       "       2109-12-10 13:05:00     1.0    NaN      NaN  NaN           NaN  NaN\n",
+       "       2109-12-10 13:58:00     0.8    NaN      NaN  NaN           NaN  NaN\n",
+       "100011 2177-08-29 04:44:00     3.8    NaN      NaN  NaN           NaN  NaN\n",
+       "       2177-08-29 06:55:00     2.3    2.3      NaN  NaN           NaN  NaN\n",
+       "100012 2177-03-14 07:38:00     2.3    NaN      NaN  NaN           NaN  NaN\n",
+       "       2177-03-14 11:42:00     2.5    2.5      NaN  NaN           NaN  NaN\n",
+       "       2177-03-15 08:05:00     2.1    2.1      NaN  NaN           NaN  NaN\n",
+       "       2177-03-15 14:01:00     2.6    2.6      NaN  NaN           NaN  NaN\n",
+       "       2177-03-15 21:42:00     1.8    1.8      NaN  NaN           NaN  NaN\n",
+       "100016 2188-05-24 12:00:00     2.0    NaN      NaN  NaN           NaN  NaN\n",
+       "100017 2103-03-11 05:10:00     1.1    NaN      1.1  NaN           NaN  NaN\n",
+       "100018 2176-08-29 15:29:00     1.3    NaN      NaN  NaN           NaN  NaN\n",
+       "       2176-08-30 09:23:00     0.9    0.9      NaN  NaN           NaN  NaN\n",
+       "       2176-08-30 10:19:00     1.0    1.0      NaN  NaN           NaN  NaN\n",
+       "       2176-08-30 11:29:00     0.9    0.9      NaN  NaN           NaN  NaN\n",
+       "       2176-08-30 12:40:00     1.1    1.1      NaN  NaN           NaN  NaN\n",
+       "100020 2142-11-30 21:54:00     1.1    NaN      NaN  NaN           NaN  NaN\n",
+       "       2142-12-03 00:17:00     1.0    NaN      NaN  NaN           NaN  NaN\n",
+       "100024 2170-09-19 10:25:00     1.4    1.4      NaN  NaN           NaN  NaN\n",
+       "       2170-09-19 16:33:00     2.6    2.6      NaN  NaN           NaN  NaN\n",
+       "       2170-09-20 02:04:00     3.2    3.2      NaN  NaN           NaN  NaN\n",
+       "...                            ...    ...      ...  ...           ...  ...\n",
+       "199976 2182-02-14 11:15:00     0.8    NaN      0.8  NaN           NaN  NaN\n",
+       "       2182-02-16 03:57:00     0.8    NaN      0.8  NaN           NaN  NaN\n",
+       "       2182-02-19 03:59:00     0.8    NaN      0.8  NaN           NaN  NaN\n",
+       "       2182-02-20 03:31:00     0.7    NaN      0.7  NaN           NaN  NaN\n",
+       "       2182-02-21 04:55:00     0.9    NaN      0.9  NaN           NaN  NaN\n",
+       "199979 2182-02-06 09:17:00     1.0    NaN      NaN  NaN           NaN  NaN\n",
+       "       2182-02-06 14:16:00     3.8    3.8      NaN  NaN           NaN  NaN\n",
+       "199981 2110-09-24 16:34:00     1.1    NaN      1.1  1.1           NaN  NaN\n",
+       "       2110-09-24 20:09:00     1.0    NaN      1.0  1.0           NaN  NaN\n",
+       "       2110-09-25 06:10:00     1.0    NaN      1.0  1.0           NaN  NaN\n",
+       "199987 2175-05-19 16:30:00     2.3    NaN      NaN  NaN           NaN  NaN\n",
+       "199988 2169-01-24 12:48:00     1.0    NaN      NaN  NaN           NaN  NaN\n",
+       "       2169-02-07 01:35:00     1.6    NaN      1.6  NaN           NaN  NaN\n",
+       "       2169-02-07 11:18:00     1.0    NaN      1.0  NaN           NaN  NaN\n",
+       "       2169-02-07 16:43:00     1.0    NaN      1.0  NaN           NaN  NaN\n",
+       "       2169-02-07 22:35:00     1.1    NaN      1.1  NaN           NaN  NaN\n",
+       "       2169-02-10 05:33:00     1.4    NaN      NaN  NaN           NaN  NaN\n",
+       "199993 2161-11-12 23:14:00     0.9    NaN      0.9  NaN           NaN  NaN\n",
+       "       2161-11-13 03:46:00     0.9    NaN      0.9  NaN           NaN  NaN\n",
+       "199994 2188-07-07 21:23:00     1.0    NaN      1.0  NaN           NaN  NaN\n",
+       "       2188-07-08 03:09:00     0.7    NaN      0.7  NaN           NaN  NaN\n",
+       "       2188-07-08 04:13:00     0.6    NaN      0.6  NaN           NaN  NaN\n",
+       "       2188-07-08 06:20:00     0.7    NaN      0.7  NaN           NaN  NaN\n",
+       "199998 2119-02-20 10:52:00     1.1    1.1      1.1  1.1           NaN  NaN\n",
+       "       2119-02-20 12:36:00     1.9    1.9      1.9  1.9           NaN  NaN\n",
+       "       2119-02-20 13:33:00     2.0    2.0      2.0  2.0           NaN  NaN\n",
+       "       2119-02-20 13:59:00     2.6    2.6      2.6  2.6           NaN  NaN\n",
+       "       2119-02-20 20:43:00     1.3    1.3      1.3  1.3           NaN  NaN\n",
+       "199999 2136-04-04 20:55:00     1.9    NaN      NaN  NaN           NaN  NaN\n",
+       "       2136-04-06 15:29:00     1.8    NaN      NaN  NaN           NaN  NaN\n",
+       "\n",
+       "[177451 rows x 6 columns]"
+      ]
+     },
+     "execution_count": 216,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_cleaned"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Keep every row, but only the columns whose 'status' column level is 'unknown'.\n",
+    "df_invalid = df_cleaned.loc[\n",
+    "    :, df_cleaned.columns.get_level_values('status') == 'unknown'\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Relabel the 'status' column level of df_invalid from 'unknown' to 'known'.\n",
+    "# rename() builds a new frame instead of mutating the column MultiIndex in\n",
+    "# place (set_labels / set_levels with inplace=True), which newer pandas\n",
+    "# releases no longer support; re-running this cell is a harmless no-op.\n",
+    "df_invalid = df_invalid.rename(columns={'unknown': 'known'}, level='status')\n",
+    "# Sanity check: every column must now carry status == 'known'.\n",
+    "assert (df_invalid.columns.get_level_values('status') == 'known').all()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"10\" halign=\"left\">lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"6\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">nom</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">mmol/L</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>50813(mmol/L)</th>\n",
+       "      <th>818</th>\n",
+       "      <th>50813</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>50813(mmol/L)</th>\n",
+       "      <th>818</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>100001</th>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100003</th>\n",
+       "      <th>2150-04-17 19:12:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-08 10:58:00</th>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-03-31 00:44:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-02 14:10:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100009</th>\n",
+       "      <th>2162-05-17 13:19:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2162-05-17 17:14:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">100010</th>\n",
+       "      <th>2109-12-10 10:25:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 12:11:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:05:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:58:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100011</th>\n",
+       "      <th>2177-08-29 04:44:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-08-29 06:55:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100012</th>\n",
+       "      <th>2177-03-14 07:38:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-14 11:42:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.5</td>\n",
+       "      <td>2.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 08:05:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.1</td>\n",
+       "      <td>2.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 14:01:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 21:42:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100016</th>\n",
+       "      <th>2188-05-24 12:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100017</th>\n",
+       "      <th>2103-03-11 05:10:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100018</th>\n",
+       "      <th>2176-08-29 15:29:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 09:23:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 10:19:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 11:29:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 12:40:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100020</th>\n",
+       "      <th>2142-11-30 21:54:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2142-12-03 00:17:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100024</th>\n",
+       "      <th>2170-09-19 10:25:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.4</td>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-19 16:33:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-20 02:04:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.2</td>\n",
+       "      <td>3.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199976</th>\n",
+       "      <th>2182-02-14 11:15:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-16 03:57:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-19 03:59:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-20 03:31:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-21 04:55:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199979</th>\n",
+       "      <th>2182-02-06 09:17:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-06 14:16:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.8</td>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">199981</th>\n",
+       "      <th>2110-09-24 16:34:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-24 20:09:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-25 06:10:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>199987</th>\n",
+       "      <th>2175-05-19 16:30:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">199988</th>\n",
+       "      <th>2169-01-24 12:48:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 01:35:00</th>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 11:18:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 16:43:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 22:35:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-10 05:33:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199993</th>\n",
+       "      <th>2161-11-12 23:14:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-11-13 03:46:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">199994</th>\n",
+       "      <th>2188-07-07 21:23:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 03:09:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 04:13:00</th>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 06:20:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-20 10:52:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 12:36:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:33:00</th>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:59:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 20:43:00</th>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-04 20:55:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 15:29:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>177451 rows × 10 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                       lactate                                        \\\n",
+       "status                        known                                         \n",
+       "variable_type                    qn                nom          qn          \n",
+       "units                      no_units           no_units      mmol/L          \n",
+       "description                     818 1531 50813(mmol/L)  818  50813 225668   \n",
+       "id     datetime                                                             \n",
+       "100001 2117-09-11 09:32:00      NaN  NaN           NaN  NaN    1.9    NaN   \n",
+       "100003 2150-04-17 19:12:00      NaN  NaN           NaN  NaN    1.1    1.1   \n",
+       "100006 2108-04-08 10:58:00      4.5  NaN           NaN  NaN    4.5    NaN   \n",
+       "100007 2145-03-31 00:44:00      NaN  NaN           NaN  NaN    3.1    NaN   \n",
+       "       2145-04-02 14:10:00      NaN  NaN           NaN  NaN    1.9    NaN   \n",
+       "100009 2162-05-17 13:19:00      NaN  NaN           NaN  NaN    1.1    1.1   \n",
+       "       2162-05-17 17:14:00      NaN  NaN           NaN  NaN    1.5    1.5   \n",
+       "100010 2109-12-10 10:25:00      NaN  NaN           NaN  NaN    0.6    NaN   \n",
+       "       2109-12-10 12:11:00      NaN  NaN           NaN  NaN    0.9    NaN   \n",
+       "       2109-12-10 13:05:00      NaN  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2109-12-10 13:58:00      NaN  NaN           NaN  NaN    0.8    NaN   \n",
+       "100011 2177-08-29 04:44:00      NaN  NaN           NaN  NaN    3.8    NaN   \n",
+       "       2177-08-29 06:55:00      NaN  NaN           NaN  NaN    2.3    2.3   \n",
+       "100012 2177-03-14 07:38:00      NaN  NaN           NaN  NaN    2.3    NaN   \n",
+       "       2177-03-14 11:42:00      NaN  NaN           NaN  NaN    2.5    2.5   \n",
+       "       2177-03-15 08:05:00      NaN  NaN           NaN  NaN    2.1    2.1   \n",
+       "       2177-03-15 14:01:00      NaN  NaN           NaN  NaN    2.6    2.6   \n",
+       "       2177-03-15 21:42:00      NaN  NaN           NaN  NaN    1.8    1.8   \n",
+       "100016 2188-05-24 12:00:00      NaN  NaN           NaN  NaN    2.0    NaN   \n",
+       "100017 2103-03-11 05:10:00      1.1  NaN           NaN  NaN    1.1    NaN   \n",
+       "100018 2176-08-29 15:29:00      NaN  NaN           NaN  NaN    1.3    NaN   \n",
+       "       2176-08-30 09:23:00      NaN  NaN           NaN  NaN    0.9    0.9   \n",
+       "       2176-08-30 10:19:00      NaN  NaN           NaN  NaN    1.0    1.0   \n",
+       "       2176-08-30 11:29:00      NaN  NaN           NaN  NaN    0.9    0.9   \n",
+       "       2176-08-30 12:40:00      NaN  NaN           NaN  NaN    1.1    1.1   \n",
+       "100020 2142-11-30 21:54:00      NaN  NaN           NaN  NaN    1.1    NaN   \n",
+       "       2142-12-03 00:17:00      NaN  NaN           NaN  NaN    1.0    NaN   \n",
+       "100024 2170-09-19 10:25:00      NaN  NaN           NaN  NaN    1.4    1.4   \n",
+       "       2170-09-19 16:33:00      NaN  NaN           NaN  NaN    2.6    2.6   \n",
+       "       2170-09-20 02:04:00      NaN  NaN           NaN  NaN    3.2    3.2   \n",
+       "...                             ...  ...           ...  ...    ...    ...   \n",
+       "199976 2182-02-14 11:15:00      0.8  NaN           NaN  NaN    0.8    NaN   \n",
+       "       2182-02-16 03:57:00      0.8  NaN           NaN  NaN    0.8    NaN   \n",
+       "       2182-02-19 03:59:00      0.8  NaN           NaN  NaN    0.8    NaN   \n",
+       "       2182-02-20 03:31:00      0.7  NaN           NaN  NaN    0.7    NaN   \n",
+       "       2182-02-21 04:55:00      0.9  NaN           NaN  NaN    0.9    NaN   \n",
+       "199979 2182-02-06 09:17:00      NaN  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2182-02-06 14:16:00      NaN  NaN           NaN  NaN    3.8    3.8   \n",
+       "199981 2110-09-24 16:34:00      1.1  1.1           NaN  NaN    1.1    NaN   \n",
+       "       2110-09-24 20:09:00      1.0  1.0           NaN  NaN    1.0    NaN   \n",
+       "       2110-09-25 06:10:00      1.0  1.0           NaN  NaN    1.0    NaN   \n",
+       "199987 2175-05-19 16:30:00      NaN  NaN           NaN  NaN    2.3    NaN   \n",
+       "199988 2169-01-24 12:48:00      NaN  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2169-02-07 01:35:00      1.6  NaN           NaN  NaN    1.6    NaN   \n",
+       "       2169-02-07 11:18:00      1.0  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2169-02-07 16:43:00      1.0  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2169-02-07 22:35:00      1.1  NaN           NaN  NaN    1.1    NaN   \n",
+       "       2169-02-10 05:33:00      NaN  NaN           NaN  NaN    1.4    NaN   \n",
+       "199993 2161-11-12 23:14:00      0.9  NaN           NaN  NaN    0.9    NaN   \n",
+       "       2161-11-13 03:46:00      0.9  NaN           NaN  NaN    0.9    NaN   \n",
+       "199994 2188-07-07 21:23:00      1.0  NaN           NaN  NaN    1.0    NaN   \n",
+       "       2188-07-08 03:09:00      0.7  NaN           NaN  NaN    0.7    NaN   \n",
+       "       2188-07-08 04:13:00      0.6  NaN           NaN  NaN    0.6    NaN   \n",
+       "       2188-07-08 06:20:00      0.7  NaN           NaN  NaN    0.7    NaN   \n",
+       "199998 2119-02-20 10:52:00      1.1  1.1           NaN  NaN    1.1    1.1   \n",
+       "       2119-02-20 12:36:00      1.9  1.9           NaN  NaN    1.9    1.9   \n",
+       "       2119-02-20 13:33:00      2.0  2.0           NaN  NaN    2.0    2.0   \n",
+       "       2119-02-20 13:59:00      2.6  2.6           NaN  NaN    2.6    2.6   \n",
+       "       2119-02-20 20:43:00      1.3  1.3           NaN  NaN    1.3    1.3   \n",
+       "199999 2136-04-04 20:55:00      NaN  NaN           NaN  NaN    1.9    NaN   \n",
+       "       2136-04-06 15:29:00      NaN  NaN           NaN  NaN    1.8    NaN   \n",
+       "\n",
+       "label                                                        \n",
+       "status                      unknown                          \n",
+       "variable_type                    qn                nom       \n",
+       "units                      no_units           no_units       \n",
+       "description                     818 1531 50813(mmol/L)  818  \n",
+       "id     datetime                                              \n",
+       "100001 2117-09-11 09:32:00      NaN  NaN           NaN  NaN  \n",
+       "100003 2150-04-17 19:12:00      NaN  NaN           NaN  NaN  \n",
+       "100006 2108-04-08 10:58:00      4.5  NaN           NaN  NaN  \n",
+       "100007 2145-03-31 00:44:00      NaN  NaN           NaN  NaN  \n",
+       "       2145-04-02 14:10:00      NaN  NaN           NaN  NaN  \n",
+       "100009 2162-05-17 13:19:00      NaN  NaN           NaN  NaN  \n",
+       "       2162-05-17 17:14:00      NaN  NaN           NaN  NaN  \n",
+       "100010 2109-12-10 10:25:00      NaN  NaN           NaN  NaN  \n",
+       "       2109-12-10 12:11:00      NaN  NaN           NaN  NaN  \n",
+       "       2109-12-10 13:05:00      NaN  NaN           NaN  NaN  \n",
+       "       2109-12-10 13:58:00      NaN  NaN           NaN  NaN  \n",
+       "100011 2177-08-29 04:44:00      NaN  NaN           NaN  NaN  \n",
+       "       2177-08-29 06:55:00      NaN  NaN           NaN  NaN  \n",
+       "100012 2177-03-14 07:38:00      NaN  NaN           NaN  NaN  \n",
+       "       2177-03-14 11:42:00      NaN  NaN           NaN  NaN  \n",
+       "       2177-03-15 08:05:00      NaN  NaN           NaN  NaN  \n",
+       "       2177-03-15 14:01:00      NaN  NaN           NaN  NaN  \n",
+       "       2177-03-15 21:42:00      NaN  NaN           NaN  NaN  \n",
+       "100016 2188-05-24 12:00:00      NaN  NaN           NaN  NaN  \n",
+       "100017 2103-03-11 05:10:00      1.1  NaN           NaN  NaN  \n",
+       "100018 2176-08-29 15:29:00      NaN  NaN           NaN  NaN  \n",
+       "       2176-08-30 09:23:00      NaN  NaN           NaN  NaN  \n",
+       "       2176-08-30 10:19:00      NaN  NaN           NaN  NaN  \n",
+       "       2176-08-30 11:29:00      NaN  NaN           NaN  NaN  \n",
+       "       2176-08-30 12:40:00      NaN  NaN           NaN  NaN  \n",
+       "100020 2142-11-30 21:54:00      NaN  NaN           NaN  NaN  \n",
+       "       2142-12-03 00:17:00      NaN  NaN           NaN  NaN  \n",
+       "100024 2170-09-19 10:25:00      NaN  NaN           NaN  NaN  \n",
+       "       2170-09-19 16:33:00      NaN  NaN           NaN  NaN  \n",
+       "       2170-09-20 02:04:00      NaN  NaN           NaN  NaN  \n",
+       "...                             ...  ...           ...  ...  \n",
+       "199976 2182-02-14 11:15:00      0.8  NaN           NaN  NaN  \n",
+       "       2182-02-16 03:57:00      0.8  NaN           NaN  NaN  \n",
+       "       2182-02-19 03:59:00      0.8  NaN           NaN  NaN  \n",
+       "       2182-02-20 03:31:00      0.7  NaN           NaN  NaN  \n",
+       "       2182-02-21 04:55:00      0.9  NaN           NaN  NaN  \n",
+       "199979 2182-02-06 09:17:00      NaN  NaN           NaN  NaN  \n",
+       "       2182-02-06 14:16:00      NaN  NaN           NaN  NaN  \n",
+       "199981 2110-09-24 16:34:00      1.1  1.1           NaN  NaN  \n",
+       "       2110-09-24 20:09:00      1.0  1.0           NaN  NaN  \n",
+       "       2110-09-25 06:10:00      1.0  1.0           NaN  NaN  \n",
+       "199987 2175-05-19 16:30:00      NaN  NaN           NaN  NaN  \n",
+       "199988 2169-01-24 12:48:00      NaN  NaN           NaN  NaN  \n",
+       "       2169-02-07 01:35:00      1.6  NaN           NaN  NaN  \n",
+       "       2169-02-07 11:18:00      1.0  NaN           NaN  NaN  \n",
+       "       2169-02-07 16:43:00      1.0  NaN           NaN  NaN  \n",
+       "       2169-02-07 22:35:00      1.1  NaN           NaN  NaN  \n",
+       "       2169-02-10 05:33:00      NaN  NaN           NaN  NaN  \n",
+       "199993 2161-11-12 23:14:00      0.9  NaN           NaN  NaN  \n",
+       "       2161-11-13 03:46:00      0.9  NaN           NaN  NaN  \n",
+       "199994 2188-07-07 21:23:00      1.0  NaN           NaN  NaN  \n",
+       "       2188-07-08 03:09:00      0.7  NaN           NaN  NaN  \n",
+       "       2188-07-08 04:13:00      0.6  NaN           NaN  NaN  \n",
+       "       2188-07-08 06:20:00      0.7  NaN           NaN  NaN  \n",
+       "199998 2119-02-20 10:52:00      1.1  1.1           NaN  NaN  \n",
+       "       2119-02-20 12:36:00      1.9  1.9           NaN  NaN  \n",
+       "       2119-02-20 13:33:00      2.0  2.0           NaN  NaN  \n",
+       "       2119-02-20 13:59:00      2.6  2.6           NaN  NaN  \n",
+       "       2119-02-20 20:43:00      1.3  1.3           NaN  NaN  \n",
+       "199999 2136-04-04 20:55:00      NaN  NaN           NaN  NaN  \n",
+       "       2136-04-06 15:29:00      NaN  NaN           NaN  NaN  \n",
+       "\n",
+       "[177451 rows x 10 columns]"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_invalid.join(df_cleaned, how='outer')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 71,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "df = utils.open_df('data/mimic_data','transformed/{}'.format(label))\n",
+    "df_cleaned = pipeline.transform(df)\n",
+    "utils.data_loss(df,df_cleaned)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 72,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(113L, 0, '0.0%')"
+      ]
+     },
+     "execution_count": 72,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": []
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Secondary/optional transformation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 99,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload (transformers)\n",
+    "pipeline1 = Pipeline([\n",
+    "        ('combine_like_columns',transformers.combine_like_cols()),\n",
+    "        ('quantitative_vales_only',transformers.quantitative_only()),\n",
+    "        ('known_col_only',transformers.known_col_only())\n",
+    "    ])\n",
+    "\n",
+    "pipeline2 = Pipeline([\n",
+    "        ('combine_like_columns',transformers.combine_like_cols()),\n",
+    "        ('max_col',transformers.max_col_only()),\n",
+    "    ])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 74,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(205349L, 20, '0.0583%')"
+      ]
+     },
+     "execution_count": 74,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_final = pipeline1.transform(df_cleaned)\n",
+    "utils.data_loss(df,df_final)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 75,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(205349L, 20, '0.0583%')"
+      ]
+     },
+     "execution_count": 75,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_final = pipeline2.transform(df_cleaned)\n",
+    "utils.data_loss(df,df_final)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Handle Categorical columns\n",
+    "\n",
+    "0. Standardize category lists\n",
+    "1. Make sure ordinal & nominal values are within the category list?\n",
+    "2. Explode nominal\n",
+    "3. Ordinal to numeric"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "def make_cat_dict(label,cat_codes):\n",
+    "    \"\"\"Map each raw category string stored for `label` to a category code.\n",
+    "\n",
+    "    The distinct values in the first column of the 'transformed/<label>'\n",
+    "    frame (read from `hdf5_fname`) are sorted, converted to str and paired\n",
+    "    positionally with `cat_codes`.\n",
+    "\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    label : name of the stored frame under 'transformed/'.\n",
+    "    cat_codes : iterable of codes, one per distinct category, in sorted order.\n",
+    "\n",
+    "    Returns\n",
+    "    -------\n",
+    "    dict mapping category string -> code.\n",
+    "\n",
+    "    Raises\n",
+    "    ------\n",
+    "    ValueError if the number of codes differs from the number of distinct\n",
+    "    categories; zip() would otherwise silently drop the surplus and leave\n",
+    "    categories unmapped (or codes unused).\n",
+    "    \"\"\"\n",
+    "    df = utils.open_df(hdf5_fname, 'transformed/{}'.format(label))\n",
+    "    mimic_cats = df.iloc[:,0].value_counts().sort_index().index.astype(str).tolist()\n",
+    "    # Materialise so len() works for any iterable and the codes can be zipped afterwards.\n",
+    "    cat_codes = list(cat_codes)\n",
+    "    if len(mimic_cats) != len(cat_codes):\n",
+    "        raise ValueError('{}: {} categories in data but {} codes given'.format(\n",
+    "            label, len(mimic_cats), len(cat_codes)))\n",
+    "    return dict(zip(mimic_cats,cat_codes))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "category_map={}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>val_numeric</th>\n",
+       "      <th>val_text</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>category_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>1</td>\n",
+       "      <td>No motor response</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2</td>\n",
+       "      <td>Extension to pain</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>3</td>\n",
+       "      <td>Flexion to pain</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>4</td>\n",
+       "      <td>Withdrawal from pain</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>5</td>\n",
+       "      <td>Localizing pain</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>6</td>\n",
+       "      <td>Obeys commands</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>1</td>\n",
+       "      <td>No eye opening</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>2</td>\n",
+       "      <td>Eye opening to pain</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>3</td>\n",
+       "      <td>Eye opening to verbal command</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>4</td>\n",
+       "      <td>Eyes open spontaneously</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>1</td>\n",
+       "      <td>No verbal response (&gt;2 yrs); no vocal response...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>2</td>\n",
+       "      <td>Incomprehensible sounds</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>3</td>\n",
+       "      <td>Inappropriate words</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>4</td>\n",
+       "      <td>Confused</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>5</td>\n",
+       "      <td>Oriented</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "             val_numeric                                           val_text\n",
+       "category_id                                                                \n",
+       "0                      1                                 No motor response \n",
+       "1                      2                                  Extension to pain\n",
+       "2                      3                                    Flexion to pain\n",
+       "3                      4                            Withdrawal from pain   \n",
+       "4                      5                                    Localizing pain\n",
+       "5                      6                                     Obeys commands\n",
+       "6                      1                                     No eye opening\n",
+       "7                      2                                Eye opening to pain\n",
+       "8                      3                      Eye opening to verbal command\n",
+       "9                      4                            Eyes open spontaneously\n",
+       "10                     1  No verbal response (>2 yrs); no vocal response...\n",
+       "11                     2                            Incomprehensible sounds\n",
+       "12                     3                                Inappropriate words\n",
+       "13                     4                                           Confused\n",
+       "14                     5                                           Oriented"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "data_dict.tables.categories"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 62,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Codes are the category_id values listed in data_dict.tables.categories:\n",
+    "# 0-5 motor, 6-9 eye opening, 10-14 verbal.\n",
+    "label = data_dict.labels.GLASGOW_COMA_SCALE_MOTOR\n",
+    "category_map[label] = make_cat_dict(label,range(0,6))\n",
+    "label = data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING\n",
+    "category_map[label] = make_cat_dict(label,range(6,10))\n",
+    "label = data_dict.labels.GLASGOW_COMA_SCALE_VERBAL\n",
+    "# Code 10 appears twice so that both '1 No Response' and '1.0 ET/Trach' map to it.\n",
+    "# list(range(...)) keeps the concatenation valid where range() is not a list (Python 3).\n",
+    "category_map[label] = make_cat_dict(label,[10] + list(range(10,15)))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 63,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'glasgow coma scale eye opening': {'1 No Response': 6,\n",
+       "  '2 To pain': 7,\n",
+       "  '3 To speech': 8,\n",
+       "  '4 Spontaneously': 9},\n",
+       " 'glasgow coma scale motor': {'1 No Response': 0,\n",
+       "  '2 Abnorm extensn': 1,\n",
+       "  '3 Abnorm flexion': 2,\n",
+       "  '4 Flex-withdraws': 3,\n",
+       "  '5 Localizes Pain': 4,\n",
+       "  '6 Obeys Commands': 5},\n",
+       " 'glasgow coma scale verbal': {'1 No Response': 10,\n",
+       "  '1.0 ET/Trach': 10,\n",
+       "  '2 Incomp sounds': 11,\n",
+       "  '3 Inapprop words': 12,\n",
+       "  '4 Confused': 13,\n",
+       "  '5 Oriented': 14}}"
+      ]
+     },
+     "execution_count": 63,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "category_map"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 57,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<module 'transformers' from 'transformers.pyc'>"
+      ]
+     },
+     "execution_count": 57,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "reload(utils)\n",
+    "reload(transformers)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 58,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>glasgow coma scale verbal</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>723</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>1.0 ET/Trach</th>\n",
+       "      <td>444357</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5 Oriented</th>\n",
+       "      <td>379668</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4 Confused</th>\n",
+       "      <td>82434</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1 No Response</th>\n",
+       "      <td>20836</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2 Incomp sounds</th>\n",
+       "      <td>18007</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3 Inapprop words</th>\n",
+       "      <td>5611</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label            glasgow coma scale verbal\n",
+       "status                               known\n",
+       "variable_type                          ord\n",
+       "units                             no_units\n",
+       "description                            723\n",
+       "1.0 ET/Trach                        444357\n",
+       "5 Oriented                          379668\n",
+       "4 Confused                           82434\n",
+       "1 No Response                        20836\n",
+       "2 Incomp sounds                      18007\n",
+       "3 Inapprop words                      5611"
+      ]
+     },
+     "execution_count": 58,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_gcs = utils.open_df(hdf5_fname, 'transformed/{}'.format(data_dict.labels.GLASGOW_COMA_SCALE_VERBAL))\n",
+    "df_gcs = standard_pipeline.transform(df_gcs)\n",
+    "df_gcs.apply(lambda x: x.value_counts())"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 59,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>glasgow coma scale verbal</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>723</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>465193</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5 Oriented</th>\n",
+       "      <td>379668</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>82434</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>18007</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>5611</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         glasgow coma scale verbal\n",
+       "status                            known\n",
+       "variable_type                       ord\n",
+       "units                          no_units\n",
+       "description                         723\n",
+       "1                                465193\n",
+       "5 Oriented                       379668\n",
+       "4                                 82434\n",
+       "2                                 18007\n",
+       "3                                  5611"
+      ]
+     },
+     "execution_count": 59,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "transformer = transformers.standardize_categories(data_dict,category_map,use_numeric=True)\n",
+    "df_gcs = transformer.transform(df_gcs)\n",
+    "df_gcs.apply(lambda x: x.value_counts())"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 60,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">glasgow coma scale verbal</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "      <th>unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "      <th>nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>723</th>\n",
+       "      <th>723</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>465193.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>18007.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>5611.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>82434.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5 Oriented</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>379668.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         glasgow coma scale verbal          \n",
+       "status                            known   unknown\n",
+       "variable_type                       ord       nom\n",
+       "units                          no_units  no_units\n",
+       "description                         723       723\n",
+       "1                              465193.0       NaN\n",
+       "2                               18007.0       NaN\n",
+       "3                                5611.0       NaN\n",
+       "4                               82434.0       NaN\n",
+       "5 Oriented                          NaN  379668.0"
+      ]
+     },
+     "execution_count": 60,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "transformer2 = transformers.split_bad_categories(data_dict,use_numeric=True)\n",
+    "transformer2.transform(df_gcs).apply(lambda x: x.value_counts())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Unified pipeline"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import icu_data_defs\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import transformers\n",
+    "from units import MedicalUreg\n",
+    "from constants import variable_type\n",
+    "import utils\n",
+    "import mimic\n",
+    "import warnings\n",
+    "warnings.filterwarnings('ignore')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload(transformers)\n",
+    "reload(utils)\n",
+    "reload(mimic)\n",
+    "hdf5_fname = 'data/mimic_data'\n",
+    "\n",
+    "#get all labels\n",
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n",
+    "ureg = MedicalUreg('config/medical_units.txt')\n",
+    "\n",
+    "agg_func = lambda x:x.iloc[0]\n",
+    "var_types_to_keep = [variable_type.QUANTITATIVE,variable_type.ORDINAL]\n",
+    "category_map = {\n",
+    "    data_dict.labels.GLASGOW_COMA_SCALE_EYE_OPENING: {\n",
+    "        '1 No Response': 6,\n",
+    "        '2 To pain': 7,\n",
+    "        '3 To speech': 8,\n",
+    "        '4 Spontaneously': 9\n",
+    "    },\n",
+    " data_dict.labels.GLASGOW_COMA_SCALE_MOTOR: {\n",
+    "        '1 No Response': 0,\n",
+    "        '2 Abnorm extensn': 1,\n",
+    "        '3 Abnorm flexion': 2,\n",
+    "        '4 Flex-withdraws': 3,\n",
+    "        '5 Localizes Pain': 4,\n",
+    "        '6 Obeys Commands': 5\n",
+    "    },\n",
+    " data_dict.labels.GLASGOW_COMA_SCALE_VERBAL: {\n",
+    "        '1 No Response': 10,\n",
+    "        '1.0 ET/Trach': 10,\n",
+    "        '2 Incomp sounds': 11,\n",
+    "        '3 Inapprop words': 12,\n",
+    "        '4 Confused': 13,\n",
+    "        '5 Oriented':14\n",
+    "    }\n",
+    "}\n",
+    "\n",
+    "mimic_transform = Pipeline([\n",
+    "    ('clean',mimic.clean_extract()),\n",
+    "    ('unstack',mimic.unstacker()),\n",
+    "    ('add_level',transformers.add_level(None,'label',axis=1)),\n",
+    "])\n",
+    "\n",
+    "# Standardization steps, run on the output of mimic_transform (see standard_pipeline.transform below).\n",
+    "# NOTE(review): what threshold=5 counts is defined in transformers.remove_small_columns -- confirm.\n",
+    "standard_pipeline = Pipeline([\n",
+    "    ('drop_small_columns', transformers.remove_small_columns(threshold=5)),\n",
+    "    ('aggregate_same_datetime', transformers.same_index_aggregator(agg_func)),\n",
+    "    ('split_dtype', transformers.split_dtype()),\n",
+    "    ('standardize_columns', transformers.standardize_columns(data_dict, ureg)),\n",
+    "    ('standardize_categories', transformers.standardize_categories(data_dict, category_map)),\n",
+    "    ('split_bad_categories', transformers.split_bad_categories(data_dict)),\n",
+    "])\n",
+    "\n",
+    "# Cleaning steps, run on the output of standard_pipeline (see cleaning_pipeline.transform below).\n",
+    "# Note: the 'quantitative_only' step receives var_types_to_keep, which also lists ORDINAL.\n",
+    "cleaning_pipeline = Pipeline([\n",
+    "    ('drop_small_columns', transformers.remove_small_columns(threshold=50)),\n",
+    "    ('combine_like_columns', transformers.combine_like_cols()),\n",
+    "    ('quantitative_only', transformers.filter_var_type(var_types_to_keep)),\n",
+    "    ('known_col_only', transformers.known_col_only()),\n",
+    "    # disabled step, kept for reference:\n",
+    "    # ('max_col', transformers.max_col_only()),\n",
+    "])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 26,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>817373.000000</td>\n",
+       "      <td>817373</td>\n",
+       "      <td>771272.000000</td>\n",
+       "      <td>817373</td>\n",
+       "      <td>817373.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>536890</td>\n",
+       "      <td>446614.000000</td>\n",
+       "      <td>6</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2159-09-30 01:00:00</td>\n",
+       "      <td>99.999996</td>\n",
+       "      <td>mL/hour</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>9</td>\n",
+       "      <td>25385.000000</td>\n",
+       "      <td>719922</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>first</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2100-06-08 04:23:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>last</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2209-08-07 14:27:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>150437.603989</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>222346.358593</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>28720.645234</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>23242.543767</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>100001.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4647.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>125824.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>225158.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>150715.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>225158.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>175466.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>225158.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>199984.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>225158.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   id             datetime          value    units  \\\n",
+       "count   817373.000000               817373  771272.000000   817373   \n",
+       "unique            NaN               536890  446614.000000        6   \n",
+       "top               NaN  2159-09-30 01:00:00      99.999996  mL/hour   \n",
+       "freq              NaN                    9   25385.000000   719922   \n",
+       "first             NaN  2100-06-08 04:23:00            NaN      NaN   \n",
+       "last              NaN  2209-08-07 14:27:00            NaN      NaN   \n",
+       "mean    150437.603989                  NaN            NaN      NaN   \n",
+       "std      28720.645234                  NaN            NaN      NaN   \n",
+       "min     100001.000000                  NaN            NaN      NaN   \n",
+       "25%     125824.000000                  NaN            NaN      NaN   \n",
+       "50%     150715.000000                  NaN            NaN      NaN   \n",
+       "75%     175466.000000                  NaN            NaN      NaN   \n",
+       "max     199984.000000                  NaN            NaN      NaN   \n",
+       "\n",
+       "               itemid  \n",
+       "count   817373.000000  \n",
+       "unique            NaN  \n",
+       "top               NaN  \n",
+       "freq              NaN  \n",
+       "first             NaN  \n",
+       "last              NaN  \n",
+       "mean    222346.358593  \n",
+       "std      23242.543767  \n",
+       "min       4647.000000  \n",
+       "25%     225158.000000  \n",
+       "50%     225158.000000  \n",
+       "75%     225158.000000  \n",
+       "max     225158.000000  "
+      ]
+     },
+     "execution_count": 26,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# read the extract stored under 'extract/<label>' and summarize every column\n",
+    "label = 'normal saline'\n",
+    "df = utils.open_df(hdf5_fname, 'extract/{}'.format(label))\n",
+    "df.describe(include='all')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 27,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"17\" halign=\"left\">normal saline</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL/hour</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>ml</th>\n",
+       "      <th>mL/hour</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th>ml</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>ml</th>\n",
+       "      <th>mL/min</th>\n",
+       "      <th>L</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">ml</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th>ml</th>\n",
+       "      <th>mL/hour</th>\n",
+       "      <th>ml</th>\n",
+       "      <th>mL/hour</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>4647</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>6190</th>\n",
+       "      <th>44053</th>\n",
+       "      <th>44053</th>\n",
+       "      <th>44440</th>\n",
+       "      <th>44440</th>\n",
+       "      <th>41913</th>\n",
+       "      <th>41913</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>719400.000000</td>\n",
+       "      <td>39402.0</td>\n",
+       "      <td>5167.0</td>\n",
+       "      <td>259.0</td>\n",
+       "      <td>160.0</td>\n",
+       "      <td>6730.000000</td>\n",
+       "      <td>50.0</td>\n",
+       "      <td>8</td>\n",
+       "      <td>80.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>443511.000000</td>\n",
+       "      <td>147.0</td>\n",
+       "      <td>243.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>4233.000000</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1</td>\n",
+       "      <td>6.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>99.999996</td>\n",
+       "      <td>500.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>49.999999</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>given</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>1000.0</td>\n",
+       "      <td>given</td>\n",
+       "      <td>17.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>37.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>20.0</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>25193.000000</td>\n",
+       "      <td>11589.0</td>\n",
+       "      <td>651.0</td>\n",
+       "      <td>259.0</td>\n",
+       "      <td>160.0</td>\n",
+       "      <td>352.000000</td>\n",
+       "      <td>50.0</td>\n",
+       "      <td>8</td>\n",
+       "      <td>60.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label        normal saline                                                 \\\n",
+       "units              mL/hour       mL      ml mL/hour no_units           ml   \n",
+       "description         225158   225158  30190   30190    30190        225158   \n",
+       "count        719400.000000  39402.0  5167.0   259.0    160.0  6730.000000   \n",
+       "unique       443511.000000    147.0   243.0     1.0      1.0  4233.000000   \n",
+       "top              99.999996    500.0     1.0     0.0      0.0    49.999999   \n",
+       "freq          25193.000000  11589.0   651.0   259.0    160.0   352.000000   \n",
+       "\n",
+       "label                                                                   \\\n",
+       "units           mL     ml mL/min       L     ml        no_units     ml   \n",
+       "description 30190  4647   225158  225158 6190   44053    44053  44440    \n",
+       "count         50.0      8   80.0     1.0      1    3.0      2.0    5.0   \n",
+       "unique         1.0      1    6.0     1.0      1    2.0      1.0    2.0   \n",
+       "top            0.0  given  100.0  1000.0  given   17.0      0.0   37.0   \n",
+       "freq          50.0      8   60.0     1.0      1    2.0      2.0    3.0   \n",
+       "\n",
+       "label                               \n",
+       "units       mL/hour     ml mL/hour  \n",
+       "description  44440  41913   41913   \n",
+       "count           1.0    2.0     1.0  \n",
+       "unique          1.0    1.0     1.0  \n",
+       "top             0.0   20.0     0.0  \n",
+       "freq            1.0    2.0     1.0  "
+      ]
+     },
+     "execution_count": 27,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# set the value of the added column level to the current label, then reshape the extract\n",
+    "# (set_params returns the pipeline itself, so the call can be chained)\n",
+    "df_tr = mimic_transform.set_params(add_level__level_val=label).transform(df)\n",
+    "df_tr.describe()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 33,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "((770238, 17), (504923, 9), 265320L, 4, '0.0202% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"9\" halign=\"left\">normal saline</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "      <th>unknown</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">mL</th>\n",
+       "      <th>mL/min</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>225158(mL/hour)</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>30190(ml)</th>\n",
+       "      <th>30190(mL/hour)</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>225158(ml)</th>\n",
+       "      <th>30190</th>\n",
+       "      <th>225158</th>\n",
+       "      <th>4647(ml)</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>456226.000000</td>\n",
+       "      <td>39261.000000</td>\n",
+       "      <td>5068.000000</td>\n",
+       "      <td>258.0</td>\n",
+       "      <td>157.0</td>\n",
+       "      <td>4844.000000</td>\n",
+       "      <td>50.0</td>\n",
+       "      <td>80.000000</td>\n",
+       "      <td>8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>given</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>75.669716</td>\n",
+       "      <td>471.560439</td>\n",
+       "      <td>4.255024</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>128.094818</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>103.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>217.566524</td>\n",
+       "      <td>372.084861</td>\n",
+       "      <td>8.418981</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>260.186534</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>55.885358</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-906.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>6.000000</td>\n",
+       "      <td>200.000000</td>\n",
+       "      <td>0.850000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>9.310294</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>15.000000</td>\n",
+       "      <td>500.000000</td>\n",
+       "      <td>1.100000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>25.000000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>62.255889</td>\n",
+       "      <td>500.000000</td>\n",
+       "      <td>2.400000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.000001</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>51947.999400</td>\n",
+       "      <td>11000.000000</td>\n",
+       "      <td>117.000000</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>5000.000160</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>300.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label           normal saline                                            \\\n",
+       "status                  known                                             \n",
+       "variable_type              qn                                             \n",
+       "units                   mL/hr            mL                       mL/hr   \n",
+       "description   225158(mL/hour)        225158    30190(ml) 30190(mL/hour)   \n",
+       "count           456226.000000  39261.000000  5068.000000          258.0   \n",
+       "unique                    NaN           NaN          NaN            NaN   \n",
+       "top                       NaN           NaN          NaN            NaN   \n",
+       "freq                      NaN           NaN          NaN            NaN   \n",
+       "mean                75.669716    471.560439     4.255024            0.0   \n",
+       "std                217.566524    372.084861     8.418981            0.0   \n",
+       "min               -906.000000      0.000000     0.000000            0.0   \n",
+       "25%                  6.000000    200.000000     0.850000            0.0   \n",
+       "50%                 15.000000    500.000000     1.100000            0.0   \n",
+       "75%                 62.255889    500.000000     2.400000            0.0   \n",
+       "max              51947.999400  11000.000000   117.000000            0.0   \n",
+       "\n",
+       "label                                                           \n",
+       "status         unknown        known           unknown           \n",
+       "variable_type       qn           qn                qn      nom  \n",
+       "units         no_units           mL            mL/min no_units  \n",
+       "description      30190   225158(ml) 30190      225158 4647(ml)  \n",
+       "count            157.0  4844.000000  50.0   80.000000        8  \n",
+       "unique             NaN          NaN   NaN         NaN        1  \n",
+       "top                NaN          NaN   NaN         NaN    given  \n",
+       "freq               NaN          NaN   NaN         NaN        8  \n",
+       "mean               0.0   128.094818   0.0  103.312500      NaN  \n",
+       "std                0.0   260.186534   0.0   55.885358      NaN  \n",
+       "min                0.0     0.000000   0.0    0.500000      NaN  \n",
+       "25%                0.0     9.310294   0.0  100.000000      NaN  \n",
+       "50%                0.0    25.000000   0.0  100.000000      NaN  \n",
+       "75%                0.0   100.000001   0.0  100.000000      NaN  \n",
+       "max                0.0  5000.000160   0.0  300.000000      NaN  "
+      ]
+     },
+     "execution_count": 33,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# apply the standardization steps, then print utils.data_loss for the before/after frames\n",
+    "df_cln1 = standard_pipeline.transform(df_tr)\n",
+    "print utils.data_loss(df_tr, df_cln1)\n",
+    "df_cln1.describe(include='all')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 36,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "this step: ((504923, 9), (504874, 2), 295L, 1, '0.0051% records')\n",
+      "overall: ((770238, 17), (504874, 2), 265615L, 5, '0.0253% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">normal saline</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>49173.000000</td>\n",
+       "      <td>456484.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>389.563178</td>\n",
+       "      <td>75.626948</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>380.287765</td>\n",
+       "      <td>217.512467</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>-906.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>6.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>250.000000</td>\n",
+       "      <td>15.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>500.000000</td>\n",
+       "      <td>62.204886</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>11000.000000</td>\n",
+       "      <td>51947.999400</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         normal saline               \n",
+       "status                known               \n",
+       "variable_type            qn               \n",
+       "units                    mL          mL/hr\n",
+       "count          49173.000000  456484.000000\n",
+       "mean             389.563178      75.626948\n",
+       "std              380.287765     217.512467\n",
+       "min                0.000000    -906.000000\n",
+       "25%              100.000000       6.000000\n",
+       "50%              250.000000      15.000000\n",
+       "75%              500.000000      62.204886\n",
+       "max            11000.000000   51947.999400"
+      ]
+     },
+     "execution_count": 36,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# apply the cleaning steps; print data_loss for this stage alone and relative to df_tr\n",
+    "df_cln2 = cleaning_pipeline.transform(df_cln1)\n",
+    "print 'this step:', utils.data_loss(df_cln1, df_cln2)\n",
+    "print 'overall:', utils.data_loss(df_tr, df_cln2)\n",
+    "df_cln2.describe(include='all')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "array([[<matplotlib.axes._subplots.AxesSubplot object at 0x0000000043A236D8>,\n",
+       "        <matplotlib.axes._subplots.AxesSubplot object at 0x0000000029BE0C18>]], dtype=object)"
+      ]
+     },
+     "execution_count": 42,
+     "metadata": {},
+     "output_type": "execute_result"
+    },
+    {
+     "data": {
+      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAgAAAAFeCAYAAADzFKfgAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAIABJREFUeJzt3X9clfX9//Hn+QGiHPBHYbd0DoyJpTMT0Fn+GE1Z2Nxn\nlVDg1Jrmr1Xb1HlDWop+0sA2P61ltvZpy88HW2K/1ubWKtJwMpdKN1xSWl/b1KwZoSUcCQ6c9/cP\nP5yJggeBA9r7cb/dvN0813W9r9f7fTjviyfnXOe6HMYYIwAAYBVnV3cAAAB0PgIAAAAWIgAAAGAh\nAgAAABYiAAAAYCECAAAAFrpoA8CaNWtUUlKitWvXavr06V3dnSauvPJKffrpp+3ezwsvvKB58+ZJ\nku677z7t2LGjXX3atWvXObeZPn261q5dqyNHjmjEiBFtrtWRvvGNb+h3v/tdl7TfuXOnrrzyyjbX\nbkv7tWvXauXKlefc12uvvaZHH320zf26UDGnz79PzOnzcyHN6UZPPfWUnnrqKeXk5OjJJ588rz60\n91hwUQaAPXv26MCBAxozZowiIiIUGRnZ1V1qwuFwdPg+V65cqWuvvbbN7bt3767u3bsH3aZHjx6S\nQjOGtmhNv0PVPiIiol2129u+pX1NmDBBpaWl2rdvX4fs+0LAnD5/zOnzdyHN6UZbtmzRxIkT29SH\n9h4L3G1q1cUeeeSRwF8IQ4cOVeO1jL7xjW/olltu0Y4dO/TRRx9p0qRJWrx4sSSpsLBQGzZskMvl\n0iWXXKJly5YpNjZWOTk5+vTTT/XBBx8oJSVFn3zyibp166a33npLlZWVSktLU58+fbRlyxZVVlZq\n5cqV+trXvqZ//vOf+s///E+dPHlSH3/8sa666io99NBDCg8PV0vXVvrFL36h1157TWFhYerVq5fy\n8/N16aWX6tlnn9WmTZtUX1+vTz/9VHPmzFFmZmaTttOnT9f06dM1dOhQ3XHHHfr617+uPXv26MSJ\nE/rhD3+oG2+8UZL0y1/+Uq+88oqMMerfv79yc3MVExOj6667TgkJCed8XpOSkjRs2LAmyw4cOKA5\nc+YoJydHV111VYu16+vrlZ+frx07dsjlcmn48OFasmSJnnvuOb311lv66U9/qvr6en3ta1/TT37y\nE91yyy168803lZeXp8WLF+uhhx7SgAED9N5778nn82nZsmUaNWqURo0apSFDhpyz3y+88IJefvll\n/fKXvzzr8entH374YW3evFl9+vRRYmKi9u7dq4KCAuXk5CgyMlLvvvuu/vWvf+mKK67QQw89pK98\n5SsaO3bsOWuf/rP55je/2eTx2LFjA+1zcnJa9bpqyZl9SU9P19q1a7V27dqg/bsYMKeZ06ezYU5L\nUlVVlbxery677DJJ0ptvvqmXX35ZlZWVGjRokP7rv/5LERERGjZsmCZMmKD9+/dr1apVHXcsMBeZ\nEydOmGuuucb4fL6z1l1//fVm9erVxhhj/vWvf5mrr77afPDBB+avf/2r+eY3v2mOHz9ujDHm+eef\nNzfeeKMxxpglS5aY733ve4F9LFmyxNx2222moaHBVFRUmMGDB5sNGzYYY4z5n//5HzNz5kxjjDGr\nV682v//9740xxvh8PvPtb3/bvPLKK8YYYwYPHhyo1eijjz4ySUlJpq6uzhhjzJNPPmmKioqM1+s1\nt912m/n000+NMcaUlZWZESNGBPo5d+5cY4wx06ZNMy+//LL54IMPzODBg83rr79ujDHm5ZdfNtdf\nf70xxpgXXnjBLFiwwDQ0NBhjjCksLDSzZ88+7+f4gw8+MCNGjDDvvvuuSU1NNX/7298Cy1uq/fDD\nD5t77rknUDsnJ8fk5uaaI0eOmDFjxhhjjHnjjTfM2LFjzaJFi4wxxjz44IPmiSeeMG+88YYZOnSo\n2bdvnzHGmN/85jdm2rRpre7v6c9Tc
48b+zp58mRz8uRJU19fb2bPnm2mT59ujDn1M8/KyjI+n8/4\nfD5z8803m+eff77V9Rt/Ni09bqzRmtfVI488Yu6///6gNaurq83w4cNNbW1tq/t5oWJOM6fPZMuc\n/sMf/mDWrVsX2N+tt95qamtrTUNDg7n55pvNiy++aIw59fprfG2eqT3HgovuI4CDBw+qb9++crub\nf/NiwoQJkqTLLrtMl1xyiT777DNt375dkyZNUq9evSRJN998sz7++GMdOXJEkpSYmNhkH9dff72c\nTqcuvfRSde/eXePGjZMkffnLX9Znn30mSVq8eLF69+6tJ554QsuXL1dFRYW8Xm+L/b7ssst01VVX\n6eabb9bq1as1ePBgTZgwQT169NAvf/lLbd26VQ8//LAee+wx1dTUnPM5CAsL09e//nVJ0pAhQwJ9\nev3117Vnzx7dcsstuummm7RhwwYdPHjwnPtqSV1dnW6//XZdddVVTVJsS7X/8pe/KCsrS07nqZfU\n9OnTtW3bNvXr10+XXXaZ3nrrLf3lL3/R3LlztXPnTkmnPr9qTNj9+vXT4MGDz9pvR3njjTeUmpqq\n7t27y+Vy6dZbb22yfty4cXK73XK73UpISOjw+lLrXletFRkZKY/HE3gNX8yY08zptvgizOmioqLA\n61s69VoPDw+X0+lUQkKCjh07FliXlJTU7D7acyy46AKA0+lUQ0NDi+sjIiKaPDbGyO/3n7Wd3+9X\nfX29JJ31eWN4eHiTx80dmBYsWKBNmzapf//++t73vhf0LS2Hw6GCggLl5+erd+/eysvL0wMPPKCj\nR4/qpptu0kcffaTk5GT96Ec/Oud+pFMT9vT9mv97e9Lv92v27Nn63e9+p9/97nd67rnn9NRTTwXd\nX0seffRRvf3223r11VdbVft0DQ0Ngef3m9/8poqLi1VSUqK0tDT169dPf/rTn9S9e3cNGDBAktSt\nW7dm99saZ3626fP5ztqmW7duTfZ5+jikpq+bttQ/ffvm6kute12dj4aGBrlcrnbt40LAnGZOn8mG\nOe3z+XTw4MEmH+O09LOQFDiXozltPRZcdAFgwIABqqysVF1dXavbjBs3Ti+99FIgTT333HPq3bu3\nYmNj29yPkpIS3XXXXZo0aZKMMdqzZ885D2L79u3T5MmTFR8frzlz5uiOO+7Qvn379NZbb6lPnz6a\nP3++xowZo61bt0rSOV+sLa0bO3asnnnmGVVXV0uSfv7znys7O7tN4wsLC9OIESO0atUq5ebmqrKy\nMmjtp59+WvX19fL7/frtb3+rMWPGSJImTpyozZs3y+/369JLL9V1112nn/70p0pLS2tT387Uu3dv\nvfvuu6qrq1N9fb22bNly1jYpKSl66aWXVFVVJb/frxdffLFDaktSnz59tHfvXknSoUOHtH///nbt\nrzUHqurqatXW1uryyy9vV60LAXOaOX0mG+b0jh07gp4j0BrtORZcdCcBRkVFKTk5WW+88Ubg7ZZG\nZ6bGxsfXXXedbr/9dt1+++2STr24Hn/88VbVa+nM2QULFuiuu+5Sr1691L17d40aNUqHDh1qsc2V\nV16pSZMm6ZZbblGPHj3UvXt33XfffYqLi9Nzzz2nG264QZGRkRo2bJj69Olz1tt8p++zpT5lZGTo\n448/1m233San06nLL79ceXl5Z2130003adWqVRo6dGjQcY8aNUrf+ta3dO+992rZsmUt1v7+97+v\nBx98UDfddJMaGhp09dVXa+nSpZKk+Ph4ORyOwBnPY8eO1WOPPabU1NQW6zdnzpw5ysrK0vXXX99k\n+dixYzVq1CilpaWpb9+++trXvnbWhB01apRmzJihrKwsRUREqF+/fudVe+/evbrvvvua/frR/Pnz\ntWTJEr3++uu64oorNGrUqKD7O9cZ2Zs2bdILL7wQeDx48GA9/fTTTbbZvn27rr/++rP+6rkYMaeZ\n0
zbO6cGDB2vy5Mmt6uu59t2uY8F5nzVwAXjzzTfNnDlzurobF62HHnrIvPPOO13djfO2adMm8+qr\nr3bIvv785z8HThhqrTNPQupKM2bMMPv37+/qbnQY5nT7MKcv/jndVu05FgT9CMAYo9zcXGVmZmrG\njBk6fPhwk/VbtmxRenq6MjMz9cwzz7SqTV5engoLCwOPN23apClTpigzM1Ovv/560NAyYsQIXXHF\nFdq+fXtrMg7O0L9//3ZdDKOruN3us/5S6CxHjx5VVlZWl9Q+U1FRkUaOHBn0K2Dn0pHz+tChQ5o6\ndaqmTZumFStWBPaxfv163XrrrbrtttsCFyupra3VD37wA333u9/V3Llzdfz4cUnM6fZiTp+/C2lO\nt1W7jwXBEsIrr7xilixZYow59XWW+fPnB9b5fD6TmppqqqqqTF1dnZkyZYqprKxssU1lZaW58847\nTWpqqtm4caMxxpiKigozefJk4/P5TFVVlZk8eXLgazUAQqMj5/W8efPMrl27jDHGLFu2zLz66qvm\n0KFDZsqUKYF9ZmZmmv3795snn3zSPPLII8YYY/74xz+alStXdsp4AZwt6DsApaWlgc/lhg8fHjgx\nQjp1QYnY2Fh5PB6FhYUpOTlZO3fuPKtNeXm5JOnkyZO655579B//8R+Bffz9739XUlKS3G63PB6P\n4uLi2n3CBYBz68h5XV5eruTkZEnS+PHjtWPHDvXr109PPPFEYJ8NDQ3q1q2bSktLNX78+CbbAuga\nQQNAdXW1oqKiAo/dbnfg6yFnruvRo0fgykanL3e5XPL7/frSl76kq6+++pz7b9wHgNDpqHnd0NDQ\n5AznyMhIVVVVyeVyBb6jv3r1ag0ZMkSxsbGqrq6Wx+MJbNt4djuAzhc0AHg8niYXw/D7/YELQ3g8\nniYT2Ov1qmfPnuds09z+z9xHdHT0OftkzuP7nADO1lHz2uVyNZnbp8/furo6LVq0SDU1NcrNzT2r\n7pmBoiXMdyA0gn4NMDExUVu3blVaWprKysqanGwQHx+vgwcP6sSJE4qIiNDu3bs1a9YsSWqxzZmu\nvvpq/fznP1ddXZ1qa2v1/vvva9CgQefsk8PhUEVF171LEBMT1aX1L4Q+2F7/QuhDTEzwX54t6ch5\nPWTIEO3atUsjR47Utm3bNHr0aEmnvkp17bXX6s4772xSt7i4WMOGDVNxcXHgo4Nz6ez53tk/1y9y\nvS/y2Dq7Xnvme0uCBoDU1FSVlJQEbmSRl5enzZs3q6amRhkZGcrJydHMmTNljFF6err69u3bbJuW\nXHrppZo+fbqmTp0qY4wWLlx41tWVAHSsjpzX2dnZWrp0qXw+n+Lj45WWlqaioiLt3r1bPp9PxcXF\ncjgcWrRokbKyspSdna2pU6cqPDxca9as6bLnALCdw1yk76919V9e/PVpd/0LoQ+h+IvgQvVF/avu\ni17vizy2zq4Xivl+0V0KGAAAtB8BAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAA\nCxEAAACwEAEAAAALEQAAALAQAQAAAAsFvRsgAHzRPfviS3r7/X9JkrpFhKn2c1+r245JHKQJXx8b\nqq4BIUMAAGC9f35YqX/Wxp56UHt+bfsd+rDjOwR0Aj4CAADAQgQAAAAsRAAAAMBCBAAAACxEAAAA\nwEIEAAAALEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIX5b0AMmf/RGHde7VrHyc/O6pHV98n\nl8vVQb0CAODicVEGgEpfb0VED2rXPj7318oY00E9AgDg4sJHAAAAWIgAAACAhQgAAABYiAAAAICF\nCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgA\nAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAA
AAICFCAAAAFiIAAAAgIUIAAAA\nWIgAAACAhdzBNjDGaPny5dq/f7/Cw8O1atUqDRgwILB+y5YtWrdundxut6ZMmaKMjIwW2xw6dEhL\nliyR0+nUoEGDlJubK0n6zW9+o82bN8vlcmnu3LmaOHFi6EYMAACCvwNQVFSkuro6bdy4UYsWLVJe\nXl5gXX19vfLz87V+/XoVFBSosLBQx44da7FNXl6eFi5cqA0bNsjv96uoqEhVVVUqKCjQM888o1//\n+td64IEHQjdaAAAgqRUBoLS0VOPGjZMkDR8+XHv37g2sO3DggGJjY+XxeBQWFqbk5GTt3LnzrDbl\n5eWSpPLyciUnJ0uSxo8frx07dqh79+7q37+/vF6vTp48KaeTTyUAAAi1oB8BVFdXKyoq6t8N3G75\n/X45nc6z1vXo0UNVVVXyer1NlrtcLjU0NMgYE1gWGRmpqqoqSdJll12mG2+8UcYYzZkzp0MGBgAA\nWhY0AHg8Hnm93sDjxl/+jeuqq6sD67xer3r27NlsG5fL1eSve6/Xq+joaG3btk2ffPKJtm7dKmOM\nZs2apcTERA0bNqxDBtgSp9OhmJgoud1Bn4JmxcREBd8oxLq6D7bXv1D6AABtEfS3X2JiorZu3aq0\ntDSVlZUpISEhsC4+Pl4HDx7UiRMnFBERod27d2vWrFmS1GybIUOGaNeuXRo5cqS2bdum0aNHKzo6\nWhEREQoLC5MkRUVFBd4ZCCW/36iioqpNASAmJkoVFaHv44XcB9vrXwh9IHwAaI+gv/1SU1NVUlKi\nzMxMSadO5Nu8ebNqamqUkZGhnJwczZw5U8YYpaenq2/fvs22kaTs7GwtXbpUPp9P8fHxSktLk8Ph\n0I4dO3TrrbfK6XQqKSlJ1113XQiHDAAAggYAh8OhFStWNFk2cODAwP9TUlKUkpIStI0kxcXFqaCg\n4Kzl99xzj+65557W9hkAALQTp9wDAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGCh\ntl0HF8BFrTNu8y1Jx44dU1ZWlv7whz8oPDxc0qkbgcXFxUmSRowYoQULFnTq2AGcQgAALHT6Lbv3\n7NmjvLw8rVu3TtK/b/P9/PPPq1u3bsrKytKECRNUWlrabJvG23wnJycrNzdXRUVFmjhxorZv3641\na9aosrIyUPfQoUMaOnSoHnvssa4aOoD/w0cAgIVCfZtv6dRdQNevX6+ePXsG9r13714dPXpUM2bM\n0Ny5c/WPf/yjU8YL4Gy8AwBYqDNu833ttddKUpP1ffv21dy5c3XDDTeotLRUixcv1rPPPhuycQJo\nGQEAsFCob/N9OofDEfj/V7/6VblcLklSUlKSKioqOnZgAFqNAABYKNS3+T7d6e8ArF27Vr169dKd\nd96pffv26fLLL29Vf0N96+Pu3cOkz9rWNjKyW7v719m3du7Mel/ksXVFvY5EAAAsFOrbfJ/u9HcA\n5syZo8WLF6u4uFhutzuwj2AqKqo6Ytgtqqnxtbmt11vbrv7FxESFfHxdVe+LPLbOrheKoEEAACzU\nGbf5bvTaa68F/h8dHa3HH3+8jb0G0JH4FgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAh\nAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIA\nAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAA\nFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYi\nAAAAYCF3sA2MMVq+fLn279+v8PBwrVq1SgMGDAis37Jli9atWye3260pU6YoIyOjxTaHDh3SkiVL\n5HQ6NWjQIOXm5kqSiouLtW7
dOknS0KFDtWzZshANFwAASK14B6CoqEh1dXXauHGjFi1apLy8vMC6\n+vp65efna/369SooKFBhYaGOHTvWYpu8vDwtXLhQGzZskN/vV1FRkbxer372s5/p8ccfV2Fhofr3\n76/jx4+HbsQAACD4OwClpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8cjSUpOTtbOnTtVVlbWpE15\nebkkqby8XMnJyZKk8ePHq6SkRBEREUpISFB+fr4OHz6sjIwM9e7du2NHCQAAmggaAKqrqxUVFfXv\nBm63/H6/nE7nWet69Oihqqoqeb3eJstdLpcaGhpkjAksi4yMVHV1tY4fP6433nhDv//97xUREaHv\nfve7GjFihGJjYztqjAAA4AxBPwLweDzyer2Bx42//BvXVVdXB9Z5vV717Nmz2TYulyvQrnHb6Oho\n9erVS8OGDVOfPn3Uo0cPJScn65133umQwQEAgOYFfQcgMTFRW7duVVpamsrKypSQkBBYFx8fr4MH\nD+rEiROKiIjQ7t27NWvWLElqts2QIUO0a9cujRw5Utu2bdPo0aM1dOhQvffee/r000/l8Xi0Z88e\n3XbbbSEa7r85nQ7FxETJ7Q76FDQrJiYq+EYh1tV9sL3+hdIHAGiLoL/9UlNTVVJSoszMTEmnTuTb\nvHmzampqlJGRoZycHM2cOVPGGKWnp6tv377NtpGk7OxsLV26VD6fT/Hx8UpLS5PD4dDChQs1c+ZM\nORwO3XjjjfrKV74SwiGf4vcbVVRUtSkAxMREqaKiKgS9unj6YHv9C6EPhA8A7RH0t5/D4dCKFSua\nLBs4cGDg/ykpKUpJSQnaRpLi4uJUUFBw1vIbb7xRN954Y2v7DAAA2okLAQEAYCECAAAAFiIAAABg\nIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCEC\nAAAAFiIAAABgIQIAAAAWIgAAAGAhAgAAABYiAAAAYCECAAAAFiIAAABgIQIAAAAWIgAAAGAhAgBg\nIWOMcnNzlZmZqRkzZujw4cNN1m/ZskXp6enKzMzUM888c842hw4d0tSpUzVt2jStWLGiyX6OHTum\nG264QXV1dZKk2tpa/eAHP9B3v/tdzZ07V8ePH++E0QJoDgEAsFBRUZHq6uq0ceNGLVq0SHl5eYF1\n9fX1ys/P1/r161VQUKDCwkIdO3asxTZ5eXlauHChNmzYIL/fr6KiIknS9u3bNWvWLFVWVgb2/fTT\nTyshIUFPPfWUvvOd72jdunWdO3AAAQQAwEKlpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8ejsLAw\nJScna+fOnWe1KS8vlySVl5crOTlZkjR+/Hjt2LFDkuRyubR+/Xr17NmzSd3x48eftS2Azufu6g4A\n6HzV1dWKiooKPHa73fL7/XI6nWet69Gjh6qqquT1epssd7lcamhokDEmsCwyMlJVVVWSpGuvvVaS\nmqyvrq6Wx+MJbFtdXR2aAQIIigAAWMjj8cjr9QYeN/7yb1x3+i9mr9ernj17NtvG5XIF2jVuGx0d\n3aSWw+Fotu6ZgeJcYmJat11bde8eJn3WtraRkd3a3b9Qj68r632Rx9YV9ToSAQCwUGJiorZu3aq0\ntDSVlZUpISEhsC4+Pl4HDx7UiRMnFBERod27d2vWrFmS1GybIUOGaNeuXRo5cqS2bdum0aNHN6l1\n+jsAiYmJKi4u1rBhw1RcXBz46CCYioqq9g75nGpqfG1u6/XWtqt/MTFRIR9fV9X7Io+ts+uFImgQ\nAAALpaamqqSkRJmZmZJOnci3efNm1dTUKCMjQzk5OZo5c6aMMUpPT1ffvn2bbSNJ2dnZWrp0qXw+\nn+Lj45WWltak1unvAGRlZSk7O1tTp05VeHi41qxZ00kjBnAmAgBgIYfDcdZX9gYOHBj4f0pKi
lJS\nUoK2kaS4uDgVFBS0WOu1114L/D8iIkIPP/xwG3sNoCPxLQAAACxEAAAAwEIEAAAALEQAAADAQgQA\nAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAALEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAA\nLEQAAADAQgQAAAAsRAAAAMBCBAAAACxEAAAAwEIEAAAALEQAAADAQgQAAAAsFDQAGGOUm5urzMxM\nzZgxQ4cPH26yfsuWLUpPT1dmZqaeeeaZc7Y5dOiQpk6dqmnTpmnFihVn1Zk9e7YKCws7amwAAKAF\nQQNAUVGR6urqtHHjRi1atEh5eXmBdfX19crPz9f69etVUFCgwsJCHTt2rMU2eXl5WrhwoTZs2CC/\n36+ioqLAvn7+85+rqqoqBEMEAABnChoASktLNW7cOEnS8OHDtXfv3sC6AwcOKDY2Vh6PR2FhYUpO\nTtbOnTvPalNeXi5JKi8vV3JysiRp/Pjx2rFjhyTp5ZdfltPp1NixYzt2dAAAoFlBA0B1dbWioqIC\nj91ut/x+f7PrevTooaqqKnm93ibLXS6XGhoaZIwJLIuMjFRVVZXee+89bd68WT/4wQ86ZEAAACA4\nd7ANPB6PvF5v4LHf75fT6Qysq66uDqzzer3q2bNns21cLlegXeO20dHRevHFF/Xxxx9rxowZOnLk\niMLDw9W/f/+QvxvgdDoUExMltzvoU9CsmJio4BuFWFf3wfb6F0ofAKAtgv72S0xM1NatW5WWlqay\nsjIlJCQE1sXHx+vgwYM6ceKEIiIitHv3bs2aNUuSmm0zZMgQ7dq1SyNHjtS2bds0evRoTZo0KbC/\ntWvXKiYmplM+CvD7jSoqqtoUAGJiolRR0bXnK3R1H2yvfyH0gfABoD2C/vZLTU1VSUmJMjMzJZ06\nkW/z5s2qqalRRkaGcnJyNHPmTBljlJ6err59+zbbRpKys7O1dOlS+Xw+xcfHKy0tLYRDAwAALQka\nABwOx1lf2Rs4cGDg/ykpKUpJSQnaRpLi4uJUUFDQYq277747WHcAAEAH4EJAAABYiAAAAICFCAAA\nAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABY\niAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgA\nAACAhQgAAABYiAAAAICFCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFiIAAAA\ngIUIAADpki9qAAARWUlEQVQAWIgAAACAhQgAAABYiAAAAICF3F3dAQCdzxij5cuXa//+/QoPD9eq\nVas0YMCAwPotW7Zo3bp1crvdmjJlijIyMlpsc+jQIS1ZskROp1ODBg1Sbm6uJGnTpk0qLCxUWFiY\n5s2bp5SUFEnS+PHjFRcXJ0kaMWKEFixY0NnDByACAGCloqIi1dXVaePGjdqzZ4/y8vK0bt06SVJ9\nfb3y8/P1/PPPq1u3bsrKytKECRNUWlrabJu8vDwtXLhQycnJys3NVVFRka655hoVFBTohRde0Oef\nf66srCyNGTNGH330kYYOHarHHnusi58BAAQAwEKlpaUaN26cJGn48OHau3dvYN2BAwcUGxsrj8cj\nSUpOTtbOnTtVVlbWpE15ebkkqby8XMnJyZJO/XVfUlIip9OppKQkud1ueTwexcXFaf/+/Tp06JCO\nHj2qGTNmqHv37lqyZIkGDhzYmUMH8H84BwCwUHV1taKiogKP3W63/H5/s+t69Oihqqoqeb3eJstd\nLpcaGhpkjAksi4yMVHV19VnbNu6jb9++mjt3rv73f/9Xc+bM0eLFi0M5TADnwDsAgIU8Ho+8Xm/g\nsd/vl9PpDKyrrq4OrPN6verZs2ezbVwuV6Bd47bR0dHN7
iM6Olrx8fFyuVySpKSkJFVUVLSqvzEx\nUcE3aofu3cOkz9rWNjKyW7v7F+rxdWW9L/LYuqJeRyIAABZKTEzU1q1blZaWprKyMiUkJATWxcfH\n6+DBgzpx4oQiIiK0e/duzZo1S5KabTNkyBDt2rVLI0eO1LZt2zR69GgNGzZMDz30kOrq6lRbW6v3\n339fgwYN0i9+8Qv16tVLd955p/bt26fLL7+8Vf2tqKjq+CfhNDU1vja39Xpr29W/mJiokI+vq+p9\nkcfW2fVCETQIAICFUlNTVVJSoszMTElSXl6eNm/erJqaGmVkZCgnJ0czZ86UMUbp6enq27dvs20k\nKTs7W0uXLpXP51N8fLzS0tLkcDg0ffp0TZ06VcYYLVy4UOHh4YG3/YuLi+V2uwP7AND5CACAhRwO\nh1asWNFk2ekn46WkpAS+tneuNpIUFxengoKCs5ZnZGQoIyOjybLo6Gg9/vjj7eg5gI7CSYAAAFiI\nAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICFCAAAAFgo6HUAOuO2oevXr9ef/vQnORwOjR8/Xnfd\ndVfoRgwAAIK/A3D6bUMXLVrU5MpdjbcNXb9+vQoKClRYWKhjx4612KbxtqEbNmyQ3+9XUVGRDh8+\nrM2bNwfuHb59+3a9++67oRsxAAAIHgBae9vQsLCwwG1Dz2zT0m1Dd+zYoX79+umJJ54I7LO+vl7d\nunXruBECAICzBA0AobxtaFVVlVwul3r16iVJWr16tYYMGaLY2Nj2jwwAALQo6DkAob5tqCTV1dUp\nJydHUVFRWr58ebsH1RpOp0MxMVFyu9t2O4QL4RaQXd0H2+tfKH0AgLYI+tsv1LcNlaT58+fr2muv\n1Z133hmKMTbL7zeqqKhqUwDo7FtOXoh9sL3+hdAHwgeA9gj62y/Utw0tKirS7t275fP5VFxcLIfD\noUWLFmn48OEhHDYAAHYLGgBCfdvQiRMnas+ePefTZwAA0E5cCAgAAAsRAAAAsBABAAAACxEAAACw\nEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBAB\nAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAA\nAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAAL\nEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEA\nAACwEAEAAAALEQAAALAQAQAAAAsRAAAAsBABAAAACxEAAACwEAEAAAALEQAAALCQO9gGxhgtX75c\n+/fvV3h4uFatWqUBAwYE1m/ZskXr1q2T2+3WlClTlJGR0WKbQ4cOacmSJXI6nRo0aJByc3MlSZs2\nbVJhYaHCwsI0b948paSkhGzAALpuXtfW1mrx4sWqrKyUx+NRfn6+evfu3VVPA2C1oO8AFBUVqa6u\nThs3btSiRYuUl5cXWFdfX6/8/HytX79eBQUFKiws1LFjx1psk5eXp4ULF2rDhg3y+/0qKirSJ598\nEmj7xBNPaM2aNfL5fKEbMYAum9dPP/20EhIS9NRTT+k73/mO1q1b11VPAWC9oO8AlJaWaty4cZKk\n4cOHa+/evYF1Bw4cUGxsrDwejyQpOTlZO3fuVFlZWZM25eXlkqTy8nIlJydLksaPH6+SkhI5nU4l\nJSXJ7XbL4/EoLi5O+/fv11e/+tWOHekZjN+vAwf+n9xu13m3PX7co2PHqgOP4+KukMt1/vsBukpX\nzOt9+/aptLRUs2fPDmxLAAC6TtAAUF1draioqH83cLvl9/vldDrPWtejRw9VVVXJ6/U2We5yudTQ\n0CBjTGBZZGSkqqurz
9q2cR/nYqoPyq/PWzfCFlR9tFffX/EvRXj6tGs/n1cf032zU/XlL8e2az/n\n68wQ0tlsr98RfYiPH9SBvTk/XTGvG5c3BovGbS8IDbXyV74lSXK5nWqo97e66fEIpw4ceK/NpTv7\ntdyZ9b7IY2upXlfO6/MVNAB4PB55vd7A48aDROO60yew1+tVz549m23jcrkC7Rq3jY6ObnYf0dHR\n5+xT0bOPtGJoAFrSVfP69H2cGRLOJSamddu11eoVPwrp/oELUdBzABITE1VcXCxJKisrU0JCQmBd\nfHy8Dh48qBMnTqiurk67d+/WNddcoxEjRjTbZsiQIdq1a5ckadu2bUpKStKwYcNUWlqquro6VVVV\n6f3339egQRdPggIuRl01r0/fR3FxceCjAwCdz2FOf/+uGaef+SudOuGnvLxcNTU1ysjI0Ouvv661\na9fKGKP09HRlZWU122bgwIH65z//qaVLl8rn8yk+Pl4rV66Uw+HQM888o8LCQhljNH/+fE2cODH0\nIwcs1lXz+vPPP1d2drYqKioUHh6uNWvW6JJLLunKpwKwVtAAAAAAvni4EBAAABYiAAAAYCECAAAA\nFgr6NcALSbDLl7ZHfX297r33Xh05ckQ+n0/z5s3TV77ylS65xGllZaWmTJmiJ598Ui6Xq1P78Ktf\n/UpbtmyRz+fT1KlTNXLkyE6tX19fr+zsbB05ckRut1v3339/pz0He/bs0c9+9jMVFBR0yOVty8rK\n9MADD8jtduu6667T3Xff3er677zzjlauXCmXy6Xw8HA9+OCD6tOnT0jrd4VXX31Vf/7zn7VmzRpJ\np56DVatWndXntWvXqri4WG63Wzk5Obr66qt1/Phx/fjHP1Ztba369u2rvLw8devWrdnLGLdGRx1f\nOut1FKpjVkv1/H6/7rvvPv3jH/+Q0+nUihUrFB4eHtJ50tHHwnPVuuWWWwLXqPjSl76kefPmhbRe\nKI615z3nzUXklVdeMUuWLDHGGFNWVmbmz5/fYft+7rnnzAMPPGCMMeazzz4zKSkpZt68eWbXrl3G\nGGOWLVtmXn31VVNRUWEmT55sfD6fqaqqMpMnTzZ1dXXmySefNI888ogxxpg//vGPZuXKlW3qh8/n\nM3fddZe54YYbzPvvv9+pfXjjjTfMvHnzjDHGeL1e88gjj3T6c1BUVGR+9KMfGWOMKSkpMffcc0+n\n9OG///u/zeTJk81tt91mjDEdUvM73/mOOXz4sDHGmNmzZ5t33nmn1fWnTZtm9u3bZ4wxZuPGjSY/\nPz+k9bvCypUrzaRJk8zChQsDy5rrc3l5ubn99tuNMcZ8+OGHZsqUKcYYY+6//37zwgsvGGOMefzx\nx8369euNz+czqamppqqqytTV1ZkpU6aYysrKVvWnI44vnfk6CtUxq6V6r776qrn33nuNMaeOFfPn\nzw9pvVAcC1uqVVtba26++eYmP8tQ1gvVsfZ85/xF9RHAuS5f2l6TJk3SD3/4Q0lSQ0ODXC6X3n77\n7SaXOP3rX/+qv//97y1e4nT8+PGBbXfs2NGmfqxevVpZWVnq27evjDGd2oft27crISFB3//+9zV/\n/nylpKR0+nMQFxcXuLpcVVWV3G53p/QhNjZWjz76aODxmZe3PZ+af/vb31RdXS2fz6cvfelLkqSx\nY8fqr3/9a6vrP/TQQxo8eLCkU3/phYeHh7R+V0hMTNTy5csDj5vrc0lJiUpLSzVmzBhJ0uWXXy6/\n369jx47pzTffDBwPGn/Wp1/GOCwsTElJSYFrFATTEceXznwddfQxK1i9iRMn6v7775ckffjhh+rZ\ns2dI63XksTBYrX379unkyZOaNWuW7rjjDu3Zsyek9Tr6WNvWOX9RBYCWLl/aEbp37x64XOkPf/hD\nLViwoNMvcfr888/rkksu0ZgxYwK1Tx9fqPtw/Phx7d27V7/4xS+0fPly/fjHP+7U+o3
tPvjgA6Wl\npWnZsmWaPn16p/wcUlNTm9zPoT01Gy+b27js9OWtrX/ppZdKkt5880399re/1R133NHsJXo7qn4o\nPfvss/r2t7/d5N/evXs1adKkJtu11Oczn/fmfh7n2ra14+6I40tnvo46+pjVmteN0+nUkiVLtHLl\nSk2ePDlk9Tr6WBhsbBEREZo1a5Z+/etfB459oXwuO/pY29Y5f1GdA3Cuy5d2hI8++kh33323pk2b\npm9961v66U9/GlgXqkucnu7555+Xw+FQSUmJ9u/fr+zsbB0/frzT+tCrVy/Fx8fL7XZr4MCB6tat\nm44ePdqpz8H69es1btw4LViwQEePHtX06dOb3B2yM/ogqd2Xtz0zfLTmEtdn+tOf/qTHH39cv/rV\nr9S7d+9Or99R0tPTlZ6eHnS75vrcs2dPhYWFNZn31dXVio6ODmzfp0+fwLjbcmnxRqE4voT6ddTR\nx6zWvG7y8/NVWVmp9PR01dbWhqReKI6F5xpbXFycYmNjA//v1auX3n777ZDVC8Wxti1z/qJ6B+Bc\nly9tr08++USzZs3S4sWLdfPNN0uSrrrqqk69xOmGDRtUUFCggoICXXnllXrwwQc1bty4TutDUlKS\n/vKXv0iSjh49qpqaGo0ePVo7d+7stOeg8ZrzkhQVFaX6+noNGTKkU/sgtf/yth6PR+Hh4Tp8+LCM\nMdq+fbuSkpJaXf/FF1/UU089pYKCAvXv31+SdPXVV3da/a7QUp9HjBih7du3yxijDz/8UMYY9erV\nS4mJidq2bZukUz+j5ORkXXHFFU0uY7xr1y5dc801raofiuNLKF9HoThmnaveiy++qF/96leSpG7d\nusnpdOqrX/1qu+ZmS/VCcSw819iee+455efnSzp17KuurtaYMWNCMjYpNMfatsz5i+pKgKaFS5F2\nhFWrVumll17SFVdcIWOMHA6HfvKTn2jlypVdconTGTNmaMWKFXI4HJ16mdWf/exn+tvf/iZjjBYt\nWqT+/fvrvvvu67T6J0+e1L333quKigrV19fr9ttv19ChQzulD0eOHNGiRYu0cePGDrm87d///net\nWrVKfr9fY8aM0Y9+dO4bzjTW/+1vf6trr71W/fr1k8fjkcPh0KhRo3T33XeHtH5X2LlzpwoLCwPf\nAmipz2vXrtW2bdtkjFFOTo4SExNVWVmp7OxsnTx5Ur1799aaNWsUERHR7GWMW6Ojji+d9ToK1TGr\npXo1NTXKycnRJ598ovr6es2dO1dXXHFFu+dmsNdpRx4LW6rl8/mUk5OjDz/8UE6nU4sXL1avXr1C\nOrZQHGvPd85fVAEAAAB0jIvqIwAAANAxCAAAAFiIAAAAgIUIAAAAWIgAAACAhQgAAABYiAAAAICF\nCAAAAFjo/wOY67O5O3hY0wAAAABJRU5ErkJggg==\n",
+      "text/plain": [
+       "<matplotlib.figure.Figure at 0x43a236a0>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "import seaborn as sns\n",
+    "df_cln2.hist(normed=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
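+    "## Single pipeline\n",
+    "\n",
+    "Combine `mimic_transform`, `standard_pipeline` and `cleaning_pipeline` into one `Pipeline`, then try it on a single component (lactate)."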
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Compose the full preprocessing chain. The step names double as the\n",
+    "# prefixes for nested parameters (e.g. transform__add_level__level_val).\n",
+    "all_pipeline = Pipeline([\n",
+    "    ('transform', mimic_transform),\n",
+    "    ('format', standard_pipeline),\n",
+    "    ('clean', cleaning_pipeline),\n",
+    "])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>382993.000000</td>\n",
+       "      <td>393608</td>\n",
+       "      <td>393608</td>\n",
+       "      <td>393608</td>\n",
+       "      <td>393608.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>187323</td>\n",
+       "      <td>616</td>\n",
+       "      <td>2</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2140-07-14 03:59:00</td>\n",
+       "      <td>1.2</td>\n",
+       "      <td>mmol/L</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>8</td>\n",
+       "      <td>20704</td>\n",
+       "      <td>393592</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>first</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2096-08-25 16:32:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>last</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2210-08-19 04:56:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>150112.612539</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>64364.242439</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>28874.716612</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>77900.842790</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>100001.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>818.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>125190.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1531.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>149789.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>50813.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>175567.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>50813.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>199999.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>225668.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   id             datetime   value   units         itemid\n",
+       "count   382993.000000               393608  393608  393608  393608.000000\n",
+       "unique            NaN               187323     616       2            NaN\n",
+       "top               NaN  2140-07-14 03:59:00     1.2  mmol/L            NaN\n",
+       "freq              NaN                    8   20704  393592            NaN\n",
+       "first             NaN  2096-08-25 16:32:00     NaN     NaN            NaN\n",
+       "last              NaN  2210-08-19 04:56:00     NaN     NaN            NaN\n",
+       "mean    150112.612539                  NaN     NaN     NaN   64364.242439\n",
+       "std      28874.716612                  NaN     NaN     NaN   77900.842790\n",
+       "min     100001.000000                  NaN     NaN     NaN     818.000000\n",
+       "25%     125190.000000                  NaN     NaN     NaN    1531.000000\n",
+       "50%     149789.000000                  NaN     NaN     NaN   50813.000000\n",
+       "75%     175567.000000                  NaN     NaN     NaN   50813.000000\n",
+       "max     199999.000000                  NaN     NaN     NaN  225668.000000"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Load the 'extract/<label>' frame for one component and summarize\n",
+    "# all of its columns (numeric and non-numeric alike).\n",
+    "label = 'lactate'\n",
+    "df = utils.open_df(\n",
+    "    hdf5_fname,\n",
+    "    'extract/{}'.format(label),\n",
+    ")\n",
+    "df.describe(include='all')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th>mmol/L</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>100001</th>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100003</th>\n",
+       "      <th>2150-04-17 19:12:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-08 10:58:00</th>\n",
+       "      <td>4.5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-03-31 00:44:00</th>\n",
+       "      <td>3.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-02 14:10:00</th>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100009</th>\n",
+       "      <th>2162-05-17 13:19:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2162-05-17 17:14:00</th>\n",
+       "      <td>1.5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">100010</th>\n",
+       "      <th>2109-12-10 10:25:00</th>\n",
+       "      <td>0.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 12:11:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:05:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:58:00</th>\n",
+       "      <td>0.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100011</th>\n",
+       "      <th>2177-08-29 04:44:00</th>\n",
+       "      <td>3.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-08-29 06:55:00</th>\n",
+       "      <td>2.3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100012</th>\n",
+       "      <th>2177-03-14 07:38:00</th>\n",
+       "      <td>2.3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-14 11:42:00</th>\n",
+       "      <td>2.5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 08:05:00</th>\n",
+       "      <td>2.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 14:01:00</th>\n",
+       "      <td>2.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 21:42:00</th>\n",
+       "      <td>1.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100016</th>\n",
+       "      <th>2188-05-24 12:00:00</th>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100017</th>\n",
+       "      <th>2103-03-11 05:10:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100018</th>\n",
+       "      <th>2176-08-29 15:29:00</th>\n",
+       "      <td>1.3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 09:23:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 10:19:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 11:29:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 12:40:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100020</th>\n",
+       "      <th>2142-11-30 21:54:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2142-12-03 00:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100024</th>\n",
+       "      <th>2170-09-19 10:25:00</th>\n",
+       "      <td>1.4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-19 16:33:00</th>\n",
+       "      <td>2.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-20 02:04:00</th>\n",
+       "      <td>3.2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199976</th>\n",
+       "      <th>2182-02-14 11:15:00</th>\n",
+       "      <td>0.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-16 03:57:00</th>\n",
+       "      <td>0.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-19 03:59:00</th>\n",
+       "      <td>0.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-20 03:31:00</th>\n",
+       "      <td>0.7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-21 04:55:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199979</th>\n",
+       "      <th>2182-02-06 09:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-06 14:16:00</th>\n",
+       "      <td>3.8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">199981</th>\n",
+       "      <th>2110-09-24 16:34:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-24 20:09:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-25 06:10:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>199987</th>\n",
+       "      <th>2175-05-19 16:30:00</th>\n",
+       "      <td>2.3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">199988</th>\n",
+       "      <th>2169-01-24 12:48:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 01:35:00</th>\n",
+       "      <td>1.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 11:18:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 16:43:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 22:35:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-10 05:33:00</th>\n",
+       "      <td>1.4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199993</th>\n",
+       "      <th>2161-11-12 23:14:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-11-13 03:46:00</th>\n",
+       "      <td>0.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">199994</th>\n",
+       "      <th>2188-07-07 21:23:00</th>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 03:09:00</th>\n",
+       "      <td>0.7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 04:13:00</th>\n",
+       "      <td>0.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 06:20:00</th>\n",
+       "      <td>0.7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-20 10:52:00</th>\n",
+       "      <td>1.1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 12:36:00</th>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:33:00</th>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:59:00</th>\n",
+       "      <td>2.6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 20:43:00</th>\n",
+       "      <td>1.3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-04 20:55:00</th>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 15:29:00</th>\n",
+       "      <td>1.8</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>177439 rows × 1 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      lactate\n",
+       "status                       known\n",
+       "variable_type                   qn\n",
+       "units                       mmol/L\n",
+       "id     datetime                   \n",
+       "100001 2117-09-11 09:32:00     1.9\n",
+       "100003 2150-04-17 19:12:00     1.1\n",
+       "100006 2108-04-08 10:58:00     4.5\n",
+       "100007 2145-03-31 00:44:00     3.1\n",
+       "       2145-04-02 14:10:00     1.9\n",
+       "100009 2162-05-17 13:19:00     1.1\n",
+       "       2162-05-17 17:14:00     1.5\n",
+       "100010 2109-12-10 10:25:00     0.6\n",
+       "       2109-12-10 12:11:00     0.9\n",
+       "       2109-12-10 13:05:00     1.0\n",
+       "       2109-12-10 13:58:00     0.8\n",
+       "100011 2177-08-29 04:44:00     3.8\n",
+       "       2177-08-29 06:55:00     2.3\n",
+       "100012 2177-03-14 07:38:00     2.3\n",
+       "       2177-03-14 11:42:00     2.5\n",
+       "       2177-03-15 08:05:00     2.1\n",
+       "       2177-03-15 14:01:00     2.6\n",
+       "       2177-03-15 21:42:00     1.8\n",
+       "100016 2188-05-24 12:00:00     2.0\n",
+       "100017 2103-03-11 05:10:00     1.1\n",
+       "100018 2176-08-29 15:29:00     1.3\n",
+       "       2176-08-30 09:23:00     0.9\n",
+       "       2176-08-30 10:19:00     1.0\n",
+       "       2176-08-30 11:29:00     0.9\n",
+       "       2176-08-30 12:40:00     1.1\n",
+       "100020 2142-11-30 21:54:00     1.1\n",
+       "       2142-12-03 00:17:00     1.0\n",
+       "100024 2170-09-19 10:25:00     1.4\n",
+       "       2170-09-19 16:33:00     2.6\n",
+       "       2170-09-20 02:04:00     3.2\n",
+       "...                            ...\n",
+       "199976 2182-02-14 11:15:00     0.8\n",
+       "       2182-02-16 03:57:00     0.8\n",
+       "       2182-02-19 03:59:00     0.8\n",
+       "       2182-02-20 03:31:00     0.7\n",
+       "       2182-02-21 04:55:00     0.9\n",
+       "199979 2182-02-06 09:17:00     1.0\n",
+       "       2182-02-06 14:16:00     3.8\n",
+       "199981 2110-09-24 16:34:00     1.1\n",
+       "       2110-09-24 20:09:00     1.0\n",
+       "       2110-09-25 06:10:00     1.0\n",
+       "199987 2175-05-19 16:30:00     2.3\n",
+       "199988 2169-01-24 12:48:00     1.0\n",
+       "       2169-02-07 01:35:00     1.6\n",
+       "       2169-02-07 11:18:00     1.0\n",
+       "       2169-02-07 16:43:00     1.0\n",
+       "       2169-02-07 22:35:00     1.1\n",
+       "       2169-02-10 05:33:00     1.4\n",
+       "199993 2161-11-12 23:14:00     0.9\n",
+       "       2161-11-13 03:46:00     0.9\n",
+       "199994 2188-07-07 21:23:00     1.0\n",
+       "       2188-07-08 03:09:00     0.7\n",
+       "       2188-07-08 04:13:00     0.6\n",
+       "       2188-07-08 06:20:00     0.7\n",
+       "199998 2119-02-20 10:52:00     1.1\n",
+       "       2119-02-20 12:36:00     1.9\n",
+       "       2119-02-20 13:33:00     2.0\n",
+       "       2119-02-20 13:59:00     2.6\n",
+       "       2119-02-20 20:43:00     1.3\n",
+       "199999 2136-04-04 20:55:00     1.9\n",
+       "       2136-04-06 15:29:00     1.8\n",
+       "\n",
+       "[177439 rows x 1 columns]"
+      ]
+     },
+     "execution_count": 5,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Point the add_level step (inside the 'transform' stage) at the current\n",
+    "# component, then run the whole chain on the frame loaded above.\n",
+    "all_pipeline.set_params(\n",
+    "    transform__add_level__level_val=label,\n",
+    ")\n",
+    "all_pipeline.transform(df)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
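+    "## Loop over everything\n",
+    "\n",
+    "Repeat the steps above for every component in turn, logging how long it takes to open each extract and run the pipeline on it."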
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import logger"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:18:23) heart rate\n",
+      "(2017-06-03 07:18:23)>> Open Extract\n",
+      "(2017-06-03 07:18:26)<< DONE (3.0s)\n",
+      "(2017-06-03 07:18:26)>> Run Pipeline\n",
+      "(2017-06-03 07:21:19)<< DONE (173.0s)\n",
+      "(2017-06-03 07:21:19)>> Analyze...\n",
+      "((7952939, 1), (7922961, 1), 29978L, 171, '0.3015% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>heart rate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>beats/min</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>7.922961e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>1.026618e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>3.552932e+03</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-8.800000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>7.700000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>9.200000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>1.190000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>9.999999e+06</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label            heart rate\n",
+       "status                known\n",
+       "variable_type            qn\n",
+       "units             beats/min\n",
+       "count          7.922961e+06\n",
+       "mean           1.026618e+02\n",
+       "std            3.552932e+03\n",
+       "min           -8.800000e+01\n",
+       "25%            7.700000e+01\n",
+       "50%            9.200000e+01\n",
+       "75%            1.190000e+02\n",
+       "max            9.999999e+06"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:21:20)<< DONE (1.0s)\n",
+      "(2017-06-03 07:21:20)>> Joining!\n",
+      "(2017-06-03 07:21:20)<< DONE (0.0s)\n",
+      "(2017-06-03 07:21:20) DONE (177.0s)\n",
+      "(2017-06-03 07:21:20) blood pressure systolic\n",
+      "(2017-06-03 07:21:20)>> Open Extract\n",
+      "(2017-06-03 07:21:23)<< DONE (3.0s)\n",
+      "(2017-06-03 07:21:23)>> Run Pipeline\n",
+      "(2017-06-03 07:25:39)<< DONE (256.0s)\n",
+      "(2017-06-03 07:25:39)>> Analyze...\n",
+      "((6374824, 1), (5974186, 1), 548979L, 174, '0.307% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>blood pressure systolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mmHg</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>5.825845e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>1.214682e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>1.311542e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-6.900000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>1.040000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>1.190000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>1.370000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>1.411460e+05</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         blood pressure systolic\n",
+       "status                          known\n",
+       "variable_type                      qn\n",
+       "units                            mmHg\n",
+       "count                    5.825845e+06\n",
+       "mean                     1.214682e+02\n",
+       "std                      1.311542e+02\n",
+       "min                     -6.900000e+01\n",
+       "25%                      1.040000e+02\n",
+       "50%                      1.190000e+02\n",
+       "75%                      1.370000e+02\n",
+       "max                      1.411460e+05"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:25:40)<< DONE (1.0s)\n",
+      "(2017-06-03 07:25:40)>> Joining!\n",
+      "(2017-06-03 07:26:28)<< DONE (48.0s)\n",
+      "(2017-06-03 07:26:28) DONE (308.0s)\n",
+      "(2017-06-03 07:26:28) blood pressure diastolic\n",
+      "(2017-06-03 07:26:28)>> Open Extract\n",
+      "(2017-06-03 07:26:31)<< DONE (3.0s)\n",
+      "(2017-06-03 07:26:31)>> Run Pipeline\n",
+      "(2017-06-03 07:30:32)<< DONE (241.0s)\n",
+      "(2017-06-03 07:30:32)>> Analyze...\n",
+      "((6371249, 1), (5976313, 1), 543269L, 170, '0.2999% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>blood pressure diastolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mmHg</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>5.827980e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>6.115824e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2.350768e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-1.600000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>5.000000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>5.900000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>6.900000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>1.141090e+05</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         blood pressure diastolic\n",
+       "status                           known\n",
+       "variable_type                       qn\n",
+       "units                             mmHg\n",
+       "count                     5.827980e+06\n",
+       "mean                      6.115824e+01\n",
+       "std                       2.350768e+02\n",
+       "min                      -1.600000e+01\n",
+       "25%                       5.000000e+01\n",
+       "50%                       5.900000e+01\n",
+       "75%                       6.900000e+01\n",
+       "max                       1.141090e+05"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:30:34)<< DONE (2.0s)\n",
+      "(2017-06-03 07:30:34)>> Joining!\n",
+      "(2017-06-03 07:31:25)<< DONE (51.0s)\n",
+      "(2017-06-03 07:31:25) DONE (297.0s)\n",
+      "(2017-06-03 07:31:25) blood pressure mean\n",
+      "(2017-06-03 07:31:25)>> Open Extract\n",
+      "(2017-06-03 07:31:26)<< DONE (1.0s)\n",
+      "(2017-06-03 07:31:26)>> Run Pipeline\n",
+      "(2017-06-03 07:32:39)<< DONE (73.0s)\n",
+      "(2017-06-03 07:32:39)>> Analyze...\n",
+      "((2536271, 1), (2415995, 1), 120276L, 0, '0.0% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>blood pressure mean</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mmHg</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>2.415995e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>7.879668e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>1.413279e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-1.350000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>6.700000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>7.700000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>8.800000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>1.201300e+05</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         blood pressure mean\n",
+       "status                      known\n",
+       "variable_type                  qn\n",
+       "units                        mmHg\n",
+       "count                2.415995e+06\n",
+       "mean                 7.879668e+01\n",
+       "std                  1.413279e+02\n",
+       "min                 -1.350000e+02\n",
+       "25%                  6.700000e+01\n",
+       "50%                  7.700000e+01\n",
+       "75%                  8.800000e+01\n",
+       "max                  1.201300e+05"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:32:40)<< DONE (1.0s)\n",
+      "(2017-06-03 07:32:40)>> Joining!\n",
+      "(2017-06-03 07:33:20)<< DONE (40.0s)\n",
+      "(2017-06-03 07:33:20) DONE (115.0s)\n",
+      "(2017-06-03 07:33:20) respiratory rate\n",
+      "(2017-06-03 07:33:20)>> Open Extract\n",
+      "(2017-06-03 07:33:24)<< DONE (4.0s)\n",
+      "(2017-06-03 07:33:24)>> Run Pipeline\n",
+      "(2017-06-03 07:37:33)<< DONE (249.0s)\n",
+      "(2017-06-03 07:37:33)>> Analyze...\n",
+      "((7810019, 1), (7780015, 1), 5072936L, 172, '0.3035% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>respiratory rate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>insp/min</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>2.737083e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>2.092347e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>1.423811e+03</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000e+00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>1.600000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>2.000000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>2.400000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>2.355555e+06</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         respiratory rate\n",
+       "status                   known\n",
+       "variable_type               qn\n",
+       "units                 insp/min\n",
+       "count             2.737083e+06\n",
+       "mean              2.092347e+01\n",
+       "std               1.423811e+03\n",
+       "min               0.000000e+00\n",
+       "25%               1.600000e+01\n",
+       "50%               2.000000e+01\n",
+       "75%               2.400000e+01\n",
+       "max               2.355555e+06"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:37:35)<< DONE (2.0s)\n",
+      "(2017-06-03 07:37:35)>> Joining!\n",
+      "(2017-06-03 07:38:29)<< DONE (54.0s)\n",
+      "(2017-06-03 07:38:29) DONE (309.0s)\n",
+      "(2017-06-03 07:38:29) temperature body\n",
+      "(2017-06-03 07:38:29)>> Open Extract\n",
+      "(2017-06-03 07:38:31)<< DONE (2.0s)\n",
+      "(2017-06-03 07:38:31)>> Run Pipeline\n",
+      "(2017-06-03 07:39:35)<< DONE (64.0s)\n",
+      "(2017-06-03 07:39:35)>> Analyze...\n",
+      "((1751447, 1), (1731794, 1), 461152L, 156, '0.3189% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>degF</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>1.290295e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>9.850479e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>9.563484e+00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-9.990000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>9.760000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>9.850000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>9.950000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>9.637000e+03</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         temperature body\n",
+       "status                   known\n",
+       "variable_type               qn\n",
+       "units                     degF\n",
+       "count             1.290295e+06\n",
+       "mean              9.850479e+01\n",
+       "std               9.563484e+00\n",
+       "min              -9.990000e+01\n",
+       "25%               9.760000e+01\n",
+       "50%               9.850000e+01\n",
+       "75%               9.950000e+01\n",
+       "max               9.637000e+03"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:39:36)<< DONE (1.0s)\n",
+      "(2017-06-03 07:39:36)>> Joining!\n",
+      "(2017-06-03 07:40:14)<< DONE (38.0s)\n",
+      "(2017-06-03 07:40:14) DONE (105.0s)\n",
+      "(2017-06-03 07:40:14) oxygen saturation pulse oximetry\n",
+      "(2017-06-03 07:40:14)>> Open Extract\n",
+      "(2017-06-03 07:40:17)<< DONE (3.0s)\n",
+      "(2017-06-03 07:40:17)>> Run Pipeline\n",
+      "(2017-06-03 07:42:42)<< DONE (145.0s)\n",
+      "(2017-06-03 07:42:42)>> Analyze...\n",
+      "((6099827, 1), (6073019, 1), 26808L, 163, '0.3326% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>oxygen saturation pulse oximetry</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>percent</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>6.073019e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>9.885942e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2.942035e+03</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000e+00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>9.600000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>9.800000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>9.900000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>6.363333e+06</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         oxygen saturation pulse oximetry\n",
+       "status                                   known\n",
+       "variable_type                               qn\n",
+       "units                                  percent\n",
+       "count                             6.073019e+06\n",
+       "mean                              9.885942e+01\n",
+       "std                               2.942035e+03\n",
+       "min                               0.000000e+00\n",
+       "25%                               9.600000e+01\n",
+       "50%                               9.800000e+01\n",
+       "75%                               9.900000e+01\n",
+       "max                               6.363333e+06"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:42:43)<< DONE (1.0s)\n",
+      "(2017-06-03 07:42:43)>> Joining!\n",
+      "(2017-06-03 07:43:35)<< DONE (52.0s)\n",
+      "(2017-06-03 07:43:35) DONE (201.0s)\n",
+      "(2017-06-03 07:43:35) weight body\n",
+      "(2017-06-03 07:43:35)>> Open Extract\n",
+      "(2017-06-03 07:43:36)<< DONE (1.0s)\n",
+      "(2017-06-03 07:43:36)>> Run Pipeline\n",
+      "(2017-06-03 07:43:40)<< DONE (4.0s)\n",
+      "(2017-06-03 07:43:40)>> Analyze...\n",
+      "((95425, 1), (94457, 1), 1956L, 158, '0.4958% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>weight body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>kg</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>9.346900e+04</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>2.676828e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>3.908673e+04</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000e+00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>6.980000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>8.340000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>9.890000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>8.654765e+06</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label           weight body\n",
+       "status                known\n",
+       "variable_type            qn\n",
+       "units                    kg\n",
+       "count          9.346900e+04\n",
+       "mean           2.676828e+02\n",
+       "std            3.908673e+04\n",
+       "min            0.000000e+00\n",
+       "25%            6.980000e+01\n",
+       "50%            8.340000e+01\n",
+       "75%            9.890000e+01\n",
+       "max            8.654765e+06"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:43:40)<< DONE (0.0s)\n",
+      "(2017-06-03 07:43:40)>> Joining!\n",
+      "(2017-06-03 07:44:15)<< DONE (35.0s)\n",
+      "(2017-06-03 07:44:15) DONE (40.0s)\n",
+      "(2017-06-03 07:44:15) output urine\n",
+      "(2017-06-03 07:44:15)>> Open Extract\n",
+      "(2017-06-03 07:44:16)<< DONE (1.0s)\n",
+      "(2017-06-03 07:44:16)>> Run Pipeline\n",
+      "(2017-06-03 07:47:57)<< DONE (221.0s)\n",
+      "(2017-06-03 07:47:57)>> Analyze...\n",
+      "((3644639, 1), (3624029, 1), 417242L, 92, '0.1758% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>output urine</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>3.216363e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>1.265574e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2.577291e+03</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-1.500000e+03</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>4.200000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>8.000000e+01</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>1.600000e+02</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>4.555555e+06</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label          output urine\n",
+       "status                known\n",
+       "variable_type            qn\n",
+       "units                    mL\n",
+       "count          3.216363e+06\n",
+       "mean           1.265574e+02\n",
+       "std            2.577291e+03\n",
+       "min           -1.500000e+03\n",
+       "25%            4.200000e+01\n",
+       "50%            8.000000e+01\n",
+       "75%            1.600000e+02\n",
+       "max            4.555555e+06"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:47:58)<< DONE (1.0s)\n",
+      "(2017-06-03 07:47:58)>> Joining!\n",
+      "(2017-06-03 07:48:43)<< DONE (45.0s)\n",
+      "(2017-06-03 07:48:43) DONE (268.0s)\n",
+      "(2017-06-03 07:48:43) glasgow coma scale motor\n",
+      "(2017-06-03 07:48:43)>> Open Extract\n",
+      "(2017-06-03 07:48:43)<< DONE (0.0s)\n",
+      "(2017-06-03 07:48:43)>> Run Pipeline\n",
+      "(2017-06-03 07:49:29)<< DONE (46.0s)\n",
+      "(2017-06-03 07:49:29)>> Analyze...\n",
+      "((952565, 1), (949198, 1), 3367L, 1, '0.0037% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>glasgow coma scale motor</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>949198</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>Obeys commands</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>642879</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         glasgow coma scale motor\n",
+       "status                           known\n",
+       "variable_type                      ord\n",
+       "units                         no_units\n",
+       "count                           949198\n",
+       "unique                               6\n",
+       "top                     Obeys commands\n",
+       "freq                            642879"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:49:29)<< DONE (0.0s)\n",
+      "(2017-06-03 07:49:29)>> Joining!\n",
+      "(2017-06-03 07:50:06)<< DONE (37.0s)\n",
+      "(2017-06-03 07:50:06) DONE (83.0s)\n",
+      "(2017-06-03 07:50:06) glasgow coma scale eye opening\n",
+      "(2017-06-03 07:50:06)>> Open Extract\n",
+      "(2017-06-03 07:50:07)<< DONE (1.0s)\n",
+      "(2017-06-03 07:50:07)>> Run Pipeline\n",
+      "(2017-06-03 07:50:50)<< DONE (43.0s)\n",
+      "(2017-06-03 07:50:50)>> Analyze...\n",
+      "((956672, 1), (953595, 1), 3077L, 1, '0.0037% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>glasgow coma scale eye opening</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>953595</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>Eyes open spontaneously</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>588057</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         glasgow coma scale eye opening\n",
+       "status                                 known\n",
+       "variable_type                            ord\n",
+       "units                               no_units\n",
+       "count                                 953595\n",
+       "unique                                     4\n",
+       "top                  Eyes open spontaneously\n",
+       "freq                                  588057"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:50:50)<< DONE (0.0s)\n",
+      "(2017-06-03 07:50:50)>> Joining!\n",
+      "(2017-06-03 07:51:28)<< DONE (38.0s)\n",
+      "(2017-06-03 07:51:28) DONE (82.0s)\n",
+      "(2017-06-03 07:51:28) glasgow coma scale verbal\n",
+      "(2017-06-03 07:51:28)>> Open Extract\n",
+      "(2017-06-03 07:51:29)<< DONE (1.0s)\n",
+      "(2017-06-03 07:51:29)>> Run Pipeline\n",
+      "(2017-06-03 07:52:14)<< DONE (45.0s)\n",
+      "(2017-06-03 07:52:14)>> Analyze...\n",
+      "((954700, 1), (950913, 1), 3787L, 2, '0.0074% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>glasgow coma scale verbal</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>ord</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>no_units</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>950913</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>No verbal response (&gt;2 yrs); no vocal response...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>465193</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                                  glasgow coma scale verbal\n",
+       "status                                                     known\n",
+       "variable_type                                                ord\n",
+       "units                                                   no_units\n",
+       "count                                                     950913\n",
+       "unique                                                         5\n",
+       "top            No verbal response (>2 yrs); no vocal response...\n",
+       "freq                                                      465193"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 07:52:14)<< DONE (0.0s)\n",
+      "(2017-06-03 07:52:14)>> Joining!\n",
+      "(2017-06-03 07:52:51)<< DONE (37.0s)\n",
+      "(2017-06-03 07:52:51) DONE (83.0s)\n",
+      "(2017-06-03 07:52:51) normal saline\n",
+      "(2017-06-03 07:52:51)>> Open Extract\n",
+      "(2017-06-03 07:52:51)<< DONE (0.0s)\n",
+      "(2017-06-03 07:52:51)>> Run Pipeline\n",
+      "(2017-06-03 08:01:38)<< DONE (527.0s)\n",
+      "(2017-06-03 08:01:38)>> Analyze...\n",
+      "((817373, 1), (504874, 2), 265615L, 8, '0.0405% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">normal saline</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>49173.000000</td>\n",
+       "      <td>456484.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>389.563178</td>\n",
+       "      <td>75.626948</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>380.287765</td>\n",
+       "      <td>217.512467</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>-906.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>6.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>250.000000</td>\n",
+       "      <td>15.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>500.000000</td>\n",
+       "      <td>62.204886</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>11000.000000</td>\n",
+       "      <td>51947.999400</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         normal saline               \n",
+       "status                known               \n",
+       "variable_type            qn               \n",
+       "units                    mL          mL/hr\n",
+       "count          49173.000000  456484.000000\n",
+       "mean             389.563178      75.626948\n",
+       "std              380.287765     217.512467\n",
+       "min                0.000000    -906.000000\n",
+       "25%              100.000000       6.000000\n",
+       "50%              250.000000      15.000000\n",
+       "75%              500.000000      62.204886\n",
+       "max            11000.000000   51947.999400"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:01:38)<< DONE (0.0s)\n",
+      "(2017-06-03 08:01:38)>> Joining!\n",
+      "(2017-06-03 08:02:15)<< DONE (37.0s)\n",
+      "(2017-06-03 08:02:15) DONE (564.0s)\n",
+      "(2017-06-03 08:02:15) lactated ringers\n",
+      "(2017-06-03 08:02:15)>> Open Extract\n",
+      "(2017-06-03 08:02:15)<< DONE (0.0s)\n",
+      "(2017-06-03 08:02:15)>> Run Pipeline\n",
+      "(2017-06-03 08:02:57)<< DONE (42.0s)\n",
+      "(2017-06-03 08:02:57)>> Analyze...\n",
+      "((504306, 1), (254175, 2), 19193L, 18, '0.1085% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>248510.000000</td>\n",
+       "      <td>2161.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>204.109607</td>\n",
+       "      <td>289.877760</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>338.277593</td>\n",
+       "      <td>418.153805</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>15.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>100.000000</td>\n",
+       "      <td>99.994818</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>200.000000</td>\n",
+       "      <td>499.999980</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>60000.000000</td>\n",
+       "      <td>3923.333176</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         lactated ringers             \n",
+       "status                   known             \n",
+       "variable_type               qn             \n",
+       "units                       mL        mL/hr\n",
+       "count            248510.000000  2161.000000\n",
+       "mean                204.109607   289.877760\n",
+       "std                 338.277593   418.153805\n",
+       "min                   0.000000     0.000000\n",
+       "25%                  15.000000     0.000000\n",
+       "50%                 100.000000    99.994818\n",
+       "75%                 200.000000   499.999980\n",
+       "max               60000.000000  3923.333176"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:02:57)<< DONE (0.0s)\n",
+      "(2017-06-03 08:02:57)>> Joining!\n",
+      "(2017-06-03 08:03:34)<< DONE (37.0s)\n",
+      "(2017-06-03 08:03:34) DONE (79.0s)\n",
+      "(2017-06-03 08:03:34) norepinephrine\n",
+      "(2017-06-03 08:03:34)>> Open Extract\n",
+      "(2017-06-03 08:03:34)<< DONE (0.0s)\n",
+      "(2017-06-03 08:03:34)>> Run Pipeline\n",
+      "(2017-06-03 08:05:19)<< DONE (105.0s)\n",
+      "(2017-06-03 08:05:19)>> Analyze...\n",
+      "((1136938, 1), (389986, 2), 331666L, 17, '0.231% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mcg/kg/min</th>\n",
+       "      <th>mcg/min</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>286781.000000</td>\n",
+       "      <td>14226.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>0.141207</td>\n",
+       "      <td>9.687762</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>0.343212</td>\n",
+       "      <td>14.889317</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>0.035000</td>\n",
+       "      <td>2.666667</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>0.080000</td>\n",
+       "      <td>6.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>0.180000</td>\n",
+       "      <td>12.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>50.000000</td>\n",
+       "      <td>250.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         norepinephrine              \n",
+       "status                 known              \n",
+       "variable_type             qn              \n",
+       "units             mcg/kg/min       mcg/min\n",
+       "count          286781.000000  14226.000000\n",
+       "mean                0.141207      9.687762\n",
+       "std                 0.343212     14.889317\n",
+       "min                 0.000000      0.000000\n",
+       "25%                 0.035000      2.666667\n",
+       "50%                 0.080000      6.000000\n",
+       "75%                 0.180000     12.000000\n",
+       "max                50.000000    250.000000"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:05:20)<< DONE (1.0s)\n",
+      "(2017-06-03 08:05:20)>> Joining!\n",
+      "(2017-06-03 08:05:58)<< DONE (38.0s)\n",
+      "(2017-06-03 08:05:58) DONE (144.0s)\n",
+      "(2017-06-03 08:05:58) vasopressin\n",
+      "(2017-06-03 08:05:58)>> Open Extract\n",
+      "(2017-06-03 08:05:58)<< DONE (0.0s)\n",
+      "(2017-06-03 08:05:58)>> Run Pipeline\n",
+      "(2017-06-03 08:06:20)<< DONE (22.0s)\n",
+      "(2017-06-03 08:06:20)>> Analyze...\n",
+      "((339184, 1), (110333, 2), 16608L, 8, '0.3406% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">vasopressin</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>units</th>\n",
+       "      <th>units/min</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>57371.000000</td>\n",
+       "      <td>98872.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>2.517366</td>\n",
+       "      <td>0.992521</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>4.842854</td>\n",
+       "      <td>1.291858</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>1.800000</td>\n",
+       "      <td>0.040000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>2.400000</td>\n",
+       "      <td>0.044000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>2.400000</td>\n",
+       "      <td>2.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>722.400000</td>\n",
+       "      <td>50.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label           vasopressin              \n",
+       "status                known              \n",
+       "variable_type            qn              \n",
+       "units                 units     units/min\n",
+       "count          57371.000000  98872.000000\n",
+       "mean               2.517366      0.992521\n",
+       "std                4.842854      1.291858\n",
+       "min                0.000000      0.000000\n",
+       "25%                1.800000      0.040000\n",
+       "50%                2.400000      0.044000\n",
+       "75%                2.400000      2.400000\n",
+       "max              722.400000     50.000000"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:06:20)<< DONE (0.0s)\n",
+      "(2017-06-03 08:06:20)>> Joining!\n",
+      "(2017-06-03 08:06:56)<< DONE (36.0s)\n",
+      "(2017-06-03 08:06:56) DONE (58.0s)\n",
+      "(2017-06-03 08:06:56) hemoglobin\n",
+      "(2017-06-03 08:06:56)>> Open Extract\n",
+      "(2017-06-03 08:06:56)<< DONE (0.0s)\n",
+      "(2017-06-03 08:06:56)>> Run Pipeline\n",
+      "(2017-06-03 08:07:52)<< DONE (56.0s)\n",
+      "(2017-06-03 08:07:52)>> Analyze...\n",
+      "((1167921, 1), (671087, 1), 641393L, 7, '0.0123% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>hemoglobin</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>g/dL</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>526528.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>10.351784</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>1.980592</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>9.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>10.100000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>11.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>130.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label             hemoglobin\n",
+       "status                 known\n",
+       "variable_type             qn\n",
+       "units                   g/dL\n",
+       "count          526528.000000\n",
+       "mean               10.351784\n",
+       "std                 1.980592\n",
+       "min                 0.000000\n",
+       "25%                 9.000000\n",
+       "50%                10.100000\n",
+       "75%                11.400000\n",
+       "max               130.000000"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:07:52)<< DONE (0.0s)\n",
+      "(2017-06-03 08:07:52)>> Joining!\n",
+      "(2017-06-03 08:08:36)<< DONE (44.0s)\n",
+      "(2017-06-03 08:08:36) DONE (100.0s)\n",
+      "(2017-06-03 08:08:36) lactate\n",
+      "(2017-06-03 08:08:36)>> Open Extract\n",
+      "(2017-06-03 08:08:37)<< DONE (1.0s)\n",
+      "(2017-06-03 08:08:37)>> Run Pipeline\n",
+      "(2017-06-03 08:08:52)<< DONE (15.0s)\n",
+      "(2017-06-03 08:08:52)>> Analyze...\n",
+      "((393608, 1), (177439, 1), 216244L, 33, '0.0962% records')\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th>lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>mmol/L</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>177364.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>8.286749</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2374.466306</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>1.200000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>1.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>2.900000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>999999.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                lactate\n",
+       "status                 known\n",
+       "variable_type             qn\n",
+       "units                 mmol/L\n",
+       "count          177364.000000\n",
+       "mean                8.286749\n",
+       "std              2374.466306\n",
+       "min                 0.000000\n",
+       "25%                 1.200000\n",
+       "50%                 1.800000\n",
+       "75%                 2.900000\n",
+       "max            999999.000000"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-03 08:08:52)<< DONE (0.0s)\n",
+      "(2017-06-03 08:08:52)>> Joining!\n",
+      "(2017-06-03 08:09:35)<< DONE (43.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>heart rate</th>\n",
+       "      <th>blood pressure systolic</th>\n",
+       "      <th>blood pressure diastolic</th>\n",
+       "      <th>blood pressure mean</th>\n",
+       "      <th>respiratory rate</th>\n",
+       "      <th>temperature body</th>\n",
+       "      <th>oxygen saturation pulse oximetry</th>\n",
+       "      <th>weight body</th>\n",
+       "      <th>output urine</th>\n",
+       "      <th>glasgow coma scale motor</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">normal saline</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">vasopressin</th>\n",
+       "      <th>hemoglobin</th>\n",
+       "      <th>lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>ord</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th>beats/min</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>insp/min</th>\n",
+       "      <th>degF</th>\n",
+       "      <th>percent</th>\n",
+       "      <th>kg</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th>...</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th>mcg/kg/min</th>\n",
+       "      <th>mcg/min</th>\n",
+       "      <th>units</th>\n",
+       "      <th>units/min</th>\n",
+       "      <th>g/dL</th>\n",
+       "      <th>mmol/L</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"10\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 09:22:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>13.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:50:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:55:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>6.996487</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:57:00</th>\n",
+       "      <td>122.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>14.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:00:00</th>\n",
+       "      <td>118.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:01:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>192.0</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>122.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>499.999980</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:49:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>300.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:50:00</th>\n",
+       "      <td>118.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>10 rows × 22 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      heart rate blood pressure systolic  \\\n",
+       "status                          known                   known   \n",
+       "variable_type                      qn                      qn   \n",
+       "units                       beats/min                    mmHg   \n",
+       "id     datetime                                                 \n",
+       "100001 2117-09-11 09:22:00        NaN                     NaN   \n",
+       "       2117-09-11 09:32:00        NaN                     NaN   \n",
+       "       2117-09-11 12:50:00        NaN                     NaN   \n",
+       "       2117-09-11 12:55:00        NaN                     NaN   \n",
+       "       2117-09-11 12:57:00      122.0                     NaN   \n",
+       "       2117-09-11 13:00:00      118.0                     NaN   \n",
+       "       2117-09-11 13:01:00        NaN                   192.0   \n",
+       "       2117-09-11 13:48:00        NaN                     NaN   \n",
+       "       2117-09-11 13:49:00        NaN                     NaN   \n",
+       "       2117-09-11 13:50:00      118.0                     NaN   \n",
+       "\n",
+       "label                      blood pressure diastolic blood pressure mean  \\\n",
+       "status                                        known               known   \n",
+       "variable_type                                    qn                  qn   \n",
+       "units                                          mmHg                mmHg   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00                      NaN                 NaN   \n",
+       "       2117-09-11 09:32:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:50:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:55:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:57:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:00:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:01:00                    100.0               122.0   \n",
+       "       2117-09-11 13:48:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:49:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:50:00                      NaN                 NaN   \n",
+       "\n",
+       "label                      respiratory rate temperature body  \\\n",
+       "status                                known            known   \n",
+       "variable_type                            qn               qn   \n",
+       "units                              insp/min             degF   \n",
+       "id     datetime                                                \n",
+       "100001 2117-09-11 09:22:00              NaN              NaN   \n",
+       "       2117-09-11 09:32:00              NaN              NaN   \n",
+       "       2117-09-11 12:50:00              NaN              NaN   \n",
+       "       2117-09-11 12:55:00              NaN              NaN   \n",
+       "       2117-09-11 12:57:00             14.0              NaN   \n",
+       "       2117-09-11 13:00:00             22.0              NaN   \n",
+       "       2117-09-11 13:01:00              NaN              NaN   \n",
+       "       2117-09-11 13:48:00              NaN             98.0   \n",
+       "       2117-09-11 13:49:00              NaN              NaN   \n",
+       "       2117-09-11 13:50:00             22.0              NaN   \n",
+       "\n",
+       "label                      oxygen saturation pulse oximetry weight body  \\\n",
+       "status                                                known       known   \n",
+       "variable_type                                            qn          qn   \n",
+       "units                                               percent          kg   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00                              NaN         NaN   \n",
+       "       2117-09-11 09:32:00                              NaN         NaN   \n",
+       "       2117-09-11 12:50:00                              NaN         NaN   \n",
+       "       2117-09-11 12:55:00                              NaN         NaN   \n",
+       "       2117-09-11 12:57:00                              NaN         NaN   \n",
+       "       2117-09-11 13:00:00                              NaN         NaN   \n",
+       "       2117-09-11 13:01:00                              NaN         NaN   \n",
+       "       2117-09-11 13:48:00                              NaN         NaN   \n",
+       "       2117-09-11 13:49:00                              NaN         NaN   \n",
+       "       2117-09-11 13:50:00                              NaN         NaN   \n",
+       "\n",
+       "label                      output urine glasgow coma scale motor   ...    \\\n",
+       "status                            known                    known   ...     \n",
+       "variable_type                        qn                      ord   ...     \n",
+       "units                                mL                 no_units   ...     \n",
+       "id     datetime                                                    ...     \n",
+       "100001 2117-09-11 09:22:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 09:32:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:50:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:55:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:57:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:01:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:48:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:49:00        300.0                      NaN   ...     \n",
+       "       2117-09-11 13:50:00          NaN                      NaN   ...     \n",
+       "\n",
+       "label                      normal saline             lactated ringers        \\\n",
+       "status                             known                        known         \n",
+       "variable_type                         qn                           qn         \n",
+       "units                                 mL       mL/hr               mL mL/hr   \n",
+       "id     datetime                                                               \n",
+       "100001 2117-09-11 09:22:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 09:32:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 12:50:00           NaN    5.000000              NaN   NaN   \n",
+       "       2117-09-11 12:55:00           NaN    6.996487              NaN   NaN   \n",
+       "       2117-09-11 12:57:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:01:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:48:00           NaN  499.999980              NaN   NaN   \n",
+       "       2117-09-11 13:49:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:50:00           NaN         NaN              NaN   NaN   \n",
+       "\n",
+       "label                      norepinephrine         vasopressin            \\\n",
+       "status                              known               known             \n",
+       "variable_type                          qn                  qn             \n",
+       "units                          mcg/kg/min mcg/min       units units/min   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 09:32:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:50:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:55:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:57:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:01:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:48:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:49:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:50:00            NaN     NaN         NaN       NaN   \n",
+       "\n",
+       "label                      hemoglobin lactate  \n",
+       "status                          known   known  \n",
+       "variable_type                      qn      qn  \n",
+       "units                            g/dL  mmol/L  \n",
+       "id     datetime                                \n",
+       "100001 2117-09-11 09:22:00       13.0     NaN  \n",
+       "       2117-09-11 09:32:00        NaN     1.9  \n",
+       "       2117-09-11 12:50:00        NaN     NaN  \n",
+       "       2117-09-11 12:55:00        NaN     NaN  \n",
+       "       2117-09-11 12:57:00        NaN     NaN  \n",
+       "       2117-09-11 13:00:00        NaN     NaN  \n",
+       "       2117-09-11 13:01:00        NaN     NaN  \n",
+       "       2117-09-11 13:48:00        NaN     NaN  \n",
+       "       2117-09-11 13:49:00        NaN     NaN  \n",
+       "       2117-09-11 13:50:00        NaN     NaN  \n",
+       "\n",
+       "[10 rows x 22 columns]"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Build the combined \"simple data\" frame: run each component label of panel 12\n",
+    "# through the shared pipeline and outer-join the per-label results into df_final.\n",
+    "reload(logger)  # re-import the logger module before logging (Python 2 builtin)\n",
+    "simple_data = data_dict.get_panel_defintions(12)  # 12 is \"simple data\"\n",
+    "labels = simple_data.label.unique().tolist()\n",
+    "\n",
+    "df_final = None\n",
+    "for label in labels:\n",
+    "    logger.log(label, new_level=True)\n",
+    "    try:\n",
+    "        logger.log('Open Extract')\n",
+    "        df_extract = utils.open_df(hdf5_fname, 'extract/{}'.format(label))\n",
+    "\n",
+    "        logger.log('Run Pipeline')\n",
+    "        # Point the pipeline's add_level step at the current label before transforming.\n",
+    "        all_pipeline.set_params(transform__add_level__level_val=label)\n",
+    "        df = all_pipeline.transform(df_extract)\n",
+    "\n",
+    "        logger.log('Analyze...')\n",
+    "        # Single-argument print(...) behaves the same as the Python 2 print statement.\n",
+    "        print(utils.data_loss(df_extract.set_index('id').value.to_frame(), df))\n",
+    "        display(df.describe())\n",
+    "\n",
+    "        logger.log('Joining!')\n",
+    "        if df_final is None:\n",
+    "            # First label: its frame seeds the accumulated result.\n",
+    "            df_final = df\n",
+    "        else:\n",
+    "            # Outer join keeps index rows that appear for any label.\n",
+    "            df_final = df_final.join(df, how='outer')\n",
+    "            del df\n",
+    "    finally:\n",
+    "        # Always close the per-label log level, even if a step above raised,\n",
+    "        # so the logger's nesting is not left open for later cells.\n",
+    "        logger.end_log_level()\n",
+    "\n",
+    "df_final.head(10)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>heart rate</th>\n",
+       "      <th>blood pressure systolic</th>\n",
+       "      <th>blood pressure diastolic</th>\n",
+       "      <th>blood pressure mean</th>\n",
+       "      <th>respiratory rate</th>\n",
+       "      <th>temperature body</th>\n",
+       "      <th>oxygen saturation pulse oximetry</th>\n",
+       "      <th>weight body</th>\n",
+       "      <th>output urine</th>\n",
+       "      <th>glasgow coma scale motor</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">normal saline</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">lactated ringers</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">norepinephrine</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">vasopressin</th>\n",
+       "      <th>hemoglobin</th>\n",
+       "      <th>lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">known</th>\n",
+       "      <th>known</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>ord</th>\n",
+       "      <th>...</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th>beats/min</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>mmHg</th>\n",
+       "      <th>insp/min</th>\n",
+       "      <th>degF</th>\n",
+       "      <th>percent</th>\n",
+       "      <th>kg</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th>...</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th>mL</th>\n",
+       "      <th>mL/hr</th>\n",
+       "      <th>mcg/kg/min</th>\n",
+       "      <th>mcg/min</th>\n",
+       "      <th>units</th>\n",
+       "      <th>units/min</th>\n",
+       "      <th>g/dL</th>\n",
+       "      <th>mmol/L</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"30\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 09:22:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>13.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:50:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:55:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>6.996487</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 12:57:00</th>\n",
+       "      <td>122.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>14.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:00:00</th>\n",
+       "      <td>118.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:01:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>192.0</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>122.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>499.999980</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:49:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>300.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 13:50:00</th>\n",
+       "      <td>118.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 14:00:00</th>\n",
+       "      <td>118.0</td>\n",
+       "      <td>165.0</td>\n",
+       "      <td>85.0</td>\n",
+       "      <td>103.0</td>\n",
+       "      <td>15.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>8.990600</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 15:00:00</th>\n",
+       "      <td>110.0</td>\n",
+       "      <td>119.0</td>\n",
+       "      <td>64.0</td>\n",
+       "      <td>76.0</td>\n",
+       "      <td>15.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 15:48:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>999.999960</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 15:59:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>199.999998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <td>104.0</td>\n",
+       "      <td>169.0</td>\n",
+       "      <td>84.0</td>\n",
+       "      <td>105.0</td>\n",
+       "      <td>16.0</td>\n",
+       "      <td>97.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:02:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:11:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>40.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:12:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.992476</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 17:00:00</th>\n",
+       "      <td>101.0</td>\n",
+       "      <td>110.0</td>\n",
+       "      <td>62.0</td>\n",
+       "      <td>75.0</td>\n",
+       "      <td>15.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 18:00:00</th>\n",
+       "      <td>112.0</td>\n",
+       "      <td>170.0</td>\n",
+       "      <td>86.0</td>\n",
+       "      <td>106.0</td>\n",
+       "      <td>16.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 18:34:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>400.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <td>108.0</td>\n",
+       "      <td>179.0</td>\n",
+       "      <td>88.0</td>\n",
+       "      <td>110.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:31:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>11.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 20:00:00</th>\n",
+       "      <td>116.0</td>\n",
+       "      <td>183.0</td>\n",
+       "      <td>91.0</td>\n",
+       "      <td>114.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 21:00:00</th>\n",
+       "      <td>117.0</td>\n",
+       "      <td>189.0</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>121.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 21:12:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.396080</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 21:16:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.012718</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <td>124.0</td>\n",
+       "      <td>180.0</td>\n",
+       "      <td>88.0</td>\n",
+       "      <td>110.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>200.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:10:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:25:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>500.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"30\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-09 09:00:00</th>\n",
+       "      <td>79.0</td>\n",
+       "      <td>130.0</td>\n",
+       "      <td>48.0</td>\n",
+       "      <td>69.0</td>\n",
+       "      <td>25.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>350.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 10:00:00</th>\n",
+       "      <td>81.0</td>\n",
+       "      <td>123.0</td>\n",
+       "      <td>64.0</td>\n",
+       "      <td>80.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 11:00:00</th>\n",
+       "      <td>89.0</td>\n",
+       "      <td>115.0</td>\n",
+       "      <td>57.0</td>\n",
+       "      <td>70.0</td>\n",
+       "      <td>16.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 12:00:00</th>\n",
+       "      <td>72.0</td>\n",
+       "      <td>119.0</td>\n",
+       "      <td>45.0</td>\n",
+       "      <td>65.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>98.3</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 13:00:00</th>\n",
+       "      <td>82.0</td>\n",
+       "      <td>156.0</td>\n",
+       "      <td>58.0</td>\n",
+       "      <td>78.0</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 14:00:00</th>\n",
+       "      <td>74.0</td>\n",
+       "      <td>128.0</td>\n",
+       "      <td>53.0</td>\n",
+       "      <td>72.0</td>\n",
+       "      <td>28.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 15:00:00</th>\n",
+       "      <td>69.0</td>\n",
+       "      <td>129.0</td>\n",
+       "      <td>49.0</td>\n",
+       "      <td>69.0</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 16:00:00</th>\n",
+       "      <td>71.0</td>\n",
+       "      <td>133.0</td>\n",
+       "      <td>46.0</td>\n",
+       "      <td>70.0</td>\n",
+       "      <td>27.0</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>400.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 17:00:00</th>\n",
+       "      <td>68.0</td>\n",
+       "      <td>150.0</td>\n",
+       "      <td>55.0</td>\n",
+       "      <td>79.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 18:00:00</th>\n",
+       "      <td>90.0</td>\n",
+       "      <td>146.0</td>\n",
+       "      <td>53.0</td>\n",
+       "      <td>79.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 19:00:00</th>\n",
+       "      <td>78.0</td>\n",
+       "      <td>134.0</td>\n",
+       "      <td>50.0</td>\n",
+       "      <td>72.0</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 20:00:00</th>\n",
+       "      <td>82.0</td>\n",
+       "      <td>142.0</td>\n",
+       "      <td>52.0</td>\n",
+       "      <td>75.0</td>\n",
+       "      <td>23.0</td>\n",
+       "      <td>97.4</td>\n",
+       "      <td>95.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>480.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 21:00:00</th>\n",
+       "      <td>81.0</td>\n",
+       "      <td>132.0</td>\n",
+       "      <td>50.0</td>\n",
+       "      <td>70.0</td>\n",
+       "      <td>29.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 22:00:00</th>\n",
+       "      <td>72.0</td>\n",
+       "      <td>112.0</td>\n",
+       "      <td>48.0</td>\n",
+       "      <td>62.0</td>\n",
+       "      <td>25.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 23:00:00</th>\n",
+       "      <td>65.0</td>\n",
+       "      <td>129.0</td>\n",
+       "      <td>42.0</td>\n",
+       "      <td>66.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 00:00:00</th>\n",
+       "      <td>80.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>25.0</td>\n",
+       "      <td>97.4</td>\n",
+       "      <td>94.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 00:01:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>128.0</td>\n",
+       "      <td>59.0</td>\n",
+       "      <td>75.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 01:00:00</th>\n",
+       "      <td>80.0</td>\n",
+       "      <td>124.0</td>\n",
+       "      <td>59.0</td>\n",
+       "      <td>75.0</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 02:00:00</th>\n",
+       "      <td>76.0</td>\n",
+       "      <td>130.0</td>\n",
+       "      <td>49.0</td>\n",
+       "      <td>68.0</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>350.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 02:28:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>12.6</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 03:00:00</th>\n",
+       "      <td>72.0</td>\n",
+       "      <td>126.0</td>\n",
+       "      <td>37.0</td>\n",
+       "      <td>61.0</td>\n",
+       "      <td>27.0</td>\n",
+       "      <td>97.4</td>\n",
+       "      <td>91.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 04:00:00</th>\n",
+       "      <td>66.0</td>\n",
+       "      <td>126.0</td>\n",
+       "      <td>31.0</td>\n",
+       "      <td>52.0</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 05:00:00</th>\n",
+       "      <td>66.0</td>\n",
+       "      <td>129.0</td>\n",
+       "      <td>39.0</td>\n",
+       "      <td>63.0</td>\n",
+       "      <td>27.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>330.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 06:00:00</th>\n",
+       "      <td>65.0</td>\n",
+       "      <td>143.0</td>\n",
+       "      <td>47.0</td>\n",
+       "      <td>71.0</td>\n",
+       "      <td>19.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>92.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 07:00:00</th>\n",
+       "      <td>79.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>28.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>92.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 08:00:00</th>\n",
+       "      <td>69.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>98.1</td>\n",
+       "      <td>96.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>200.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 09:00:00</th>\n",
+       "      <td>79.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>93.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 09:10:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>128.0</td>\n",
+       "      <td>81.0</td>\n",
+       "      <td>89.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 10:00:00</th>\n",
+       "      <td>72.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>26.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>200.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 11:00:00</th>\n",
+       "      <td>72.0</td>\n",
+       "      <td>144.0</td>\n",
+       "      <td>123.0</td>\n",
+       "      <td>128.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>...</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>10071464 rows × 22 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      heart rate blood pressure systolic  \\\n",
+       "status                          known                   known   \n",
+       "variable_type                      qn                      qn   \n",
+       "units                       beats/min                    mmHg   \n",
+       "id     datetime                                                 \n",
+       "100001 2117-09-11 09:22:00        NaN                     NaN   \n",
+       "       2117-09-11 09:32:00        NaN                     NaN   \n",
+       "       2117-09-11 12:50:00        NaN                     NaN   \n",
+       "       2117-09-11 12:55:00        NaN                     NaN   \n",
+       "       2117-09-11 12:57:00      122.0                     NaN   \n",
+       "       2117-09-11 13:00:00      118.0                     NaN   \n",
+       "       2117-09-11 13:01:00        NaN                   192.0   \n",
+       "       2117-09-11 13:48:00        NaN                     NaN   \n",
+       "       2117-09-11 13:49:00        NaN                     NaN   \n",
+       "       2117-09-11 13:50:00      118.0                     NaN   \n",
+       "       2117-09-11 14:00:00      118.0                   165.0   \n",
+       "       2117-09-11 15:00:00      110.0                   119.0   \n",
+       "       2117-09-11 15:48:00        NaN                     NaN   \n",
+       "       2117-09-11 15:59:00        NaN                     NaN   \n",
+       "       2117-09-11 16:00:00      104.0                   169.0   \n",
+       "       2117-09-11 16:02:00        NaN                     NaN   \n",
+       "       2117-09-11 16:11:00        NaN                     NaN   \n",
+       "       2117-09-11 16:12:00        NaN                     NaN   \n",
+       "       2117-09-11 17:00:00      101.0                   110.0   \n",
+       "       2117-09-11 18:00:00      112.0                   170.0   \n",
+       "       2117-09-11 18:34:00        NaN                     NaN   \n",
+       "       2117-09-11 19:00:00      108.0                   179.0   \n",
+       "       2117-09-11 19:31:00        NaN                     NaN   \n",
+       "       2117-09-11 20:00:00      116.0                   183.0   \n",
+       "       2117-09-11 21:00:00      117.0                   189.0   \n",
+       "       2117-09-11 21:12:00        NaN                     NaN   \n",
+       "       2117-09-11 21:16:00        NaN                     NaN   \n",
+       "       2117-09-11 22:00:00      124.0                   180.0   \n",
+       "       2117-09-11 22:10:00        NaN                     NaN   \n",
+       "       2117-09-11 22:25:00        NaN                     NaN   \n",
+       "...                               ...                     ...   \n",
+       "199999 2136-04-09 09:00:00       79.0                   130.0   \n",
+       "       2136-04-09 10:00:00       81.0                   123.0   \n",
+       "       2136-04-09 11:00:00       89.0                   115.0   \n",
+       "       2136-04-09 12:00:00       72.0                   119.0   \n",
+       "       2136-04-09 13:00:00       82.0                   156.0   \n",
+       "       2136-04-09 14:00:00       74.0                   128.0   \n",
+       "       2136-04-09 15:00:00       69.0                   129.0   \n",
+       "       2136-04-09 16:00:00       71.0                   133.0   \n",
+       "       2136-04-09 17:00:00       68.0                   150.0   \n",
+       "       2136-04-09 18:00:00       90.0                   146.0   \n",
+       "       2136-04-09 19:00:00       78.0                   134.0   \n",
+       "       2136-04-09 20:00:00       82.0                   142.0   \n",
+       "       2136-04-09 21:00:00       81.0                   132.0   \n",
+       "       2136-04-09 22:00:00       72.0                   112.0   \n",
+       "       2136-04-09 23:00:00       65.0                   129.0   \n",
+       "       2136-04-10 00:00:00       80.0                     NaN   \n",
+       "       2136-04-10 00:01:00        NaN                   128.0   \n",
+       "       2136-04-10 01:00:00       80.0                   124.0   \n",
+       "       2136-04-10 02:00:00       76.0                   130.0   \n",
+       "       2136-04-10 02:28:00        NaN                     NaN   \n",
+       "       2136-04-10 03:00:00       72.0                   126.0   \n",
+       "       2136-04-10 04:00:00       66.0                   126.0   \n",
+       "       2136-04-10 05:00:00       66.0                   129.0   \n",
+       "       2136-04-10 06:00:00       65.0                   143.0   \n",
+       "       2136-04-10 07:00:00       79.0                     NaN   \n",
+       "       2136-04-10 08:00:00       69.0                     NaN   \n",
+       "       2136-04-10 09:00:00       79.0                     NaN   \n",
+       "       2136-04-10 09:10:00        NaN                   128.0   \n",
+       "       2136-04-10 10:00:00       72.0                     NaN   \n",
+       "       2136-04-10 11:00:00       72.0                   144.0   \n",
+       "\n",
+       "label                      blood pressure diastolic blood pressure mean  \\\n",
+       "status                                        known               known   \n",
+       "variable_type                                    qn                  qn   \n",
+       "units                                          mmHg                mmHg   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00                      NaN                 NaN   \n",
+       "       2117-09-11 09:32:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:50:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:55:00                      NaN                 NaN   \n",
+       "       2117-09-11 12:57:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:00:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:01:00                    100.0               122.0   \n",
+       "       2117-09-11 13:48:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:49:00                      NaN                 NaN   \n",
+       "       2117-09-11 13:50:00                      NaN                 NaN   \n",
+       "       2117-09-11 14:00:00                     85.0               103.0   \n",
+       "       2117-09-11 15:00:00                     64.0                76.0   \n",
+       "       2117-09-11 15:48:00                      NaN                 NaN   \n",
+       "       2117-09-11 15:59:00                      NaN                 NaN   \n",
+       "       2117-09-11 16:00:00                     84.0               105.0   \n",
+       "       2117-09-11 16:02:00                      NaN                 NaN   \n",
+       "       2117-09-11 16:11:00                      NaN                 NaN   \n",
+       "       2117-09-11 16:12:00                      NaN                 NaN   \n",
+       "       2117-09-11 17:00:00                     62.0                75.0   \n",
+       "       2117-09-11 18:00:00                     86.0               106.0   \n",
+       "       2117-09-11 18:34:00                      NaN                 NaN   \n",
+       "       2117-09-11 19:00:00                     88.0               110.0   \n",
+       "       2117-09-11 19:31:00                      NaN                 NaN   \n",
+       "       2117-09-11 20:00:00                     91.0               114.0   \n",
+       "       2117-09-11 21:00:00                     98.0               121.0   \n",
+       "       2117-09-11 21:12:00                      NaN                 NaN   \n",
+       "       2117-09-11 21:16:00                      NaN                 NaN   \n",
+       "       2117-09-11 22:00:00                     88.0               110.0   \n",
+       "       2117-09-11 22:10:00                      NaN                 NaN   \n",
+       "       2117-09-11 22:25:00                      NaN                 NaN   \n",
+       "...                                             ...                 ...   \n",
+       "199999 2136-04-09 09:00:00                     48.0                69.0   \n",
+       "       2136-04-09 10:00:00                     64.0                80.0   \n",
+       "       2136-04-09 11:00:00                     57.0                70.0   \n",
+       "       2136-04-09 12:00:00                     45.0                65.0   \n",
+       "       2136-04-09 13:00:00                     58.0                78.0   \n",
+       "       2136-04-09 14:00:00                     53.0                72.0   \n",
+       "       2136-04-09 15:00:00                     49.0                69.0   \n",
+       "       2136-04-09 16:00:00                     46.0                70.0   \n",
+       "       2136-04-09 17:00:00                     55.0                79.0   \n",
+       "       2136-04-09 18:00:00                     53.0                79.0   \n",
+       "       2136-04-09 19:00:00                     50.0                72.0   \n",
+       "       2136-04-09 20:00:00                     52.0                75.0   \n",
+       "       2136-04-09 21:00:00                     50.0                70.0   \n",
+       "       2136-04-09 22:00:00                     48.0                62.0   \n",
+       "       2136-04-09 23:00:00                     42.0                66.0   \n",
+       "       2136-04-10 00:00:00                      NaN                 NaN   \n",
+       "       2136-04-10 00:01:00                     59.0                75.0   \n",
+       "       2136-04-10 01:00:00                     59.0                75.0   \n",
+       "       2136-04-10 02:00:00                     49.0                68.0   \n",
+       "       2136-04-10 02:28:00                      NaN                 NaN   \n",
+       "       2136-04-10 03:00:00                     37.0                61.0   \n",
+       "       2136-04-10 04:00:00                     31.0                52.0   \n",
+       "       2136-04-10 05:00:00                     39.0                63.0   \n",
+       "       2136-04-10 06:00:00                     47.0                71.0   \n",
+       "       2136-04-10 07:00:00                      NaN                 NaN   \n",
+       "       2136-04-10 08:00:00                      NaN                 NaN   \n",
+       "       2136-04-10 09:00:00                      NaN                 NaN   \n",
+       "       2136-04-10 09:10:00                     81.0                89.0   \n",
+       "       2136-04-10 10:00:00                      NaN                 NaN   \n",
+       "       2136-04-10 11:00:00                    123.0               128.0   \n",
+       "\n",
+       "label                      respiratory rate temperature body  \\\n",
+       "status                                known            known   \n",
+       "variable_type                            qn               qn   \n",
+       "units                              insp/min             degF   \n",
+       "id     datetime                                                \n",
+       "100001 2117-09-11 09:22:00              NaN              NaN   \n",
+       "       2117-09-11 09:32:00              NaN              NaN   \n",
+       "       2117-09-11 12:50:00              NaN              NaN   \n",
+       "       2117-09-11 12:55:00              NaN              NaN   \n",
+       "       2117-09-11 12:57:00             14.0              NaN   \n",
+       "       2117-09-11 13:00:00             22.0              NaN   \n",
+       "       2117-09-11 13:01:00              NaN              NaN   \n",
+       "       2117-09-11 13:48:00              NaN             98.0   \n",
+       "       2117-09-11 13:49:00              NaN              NaN   \n",
+       "       2117-09-11 13:50:00             22.0              NaN   \n",
+       "       2117-09-11 14:00:00             15.0              NaN   \n",
+       "       2117-09-11 15:00:00             15.0              NaN   \n",
+       "       2117-09-11 15:48:00              NaN              NaN   \n",
+       "       2117-09-11 15:59:00              NaN              NaN   \n",
+       "       2117-09-11 16:00:00             16.0             97.9   \n",
+       "       2117-09-11 16:02:00              NaN              NaN   \n",
+       "       2117-09-11 16:11:00              NaN              NaN   \n",
+       "       2117-09-11 16:12:00              NaN              NaN   \n",
+       "       2117-09-11 17:00:00             15.0              NaN   \n",
+       "       2117-09-11 18:00:00             16.0              NaN   \n",
+       "       2117-09-11 18:34:00              NaN              NaN   \n",
+       "       2117-09-11 19:00:00              NaN             99.5   \n",
+       "       2117-09-11 19:31:00              NaN              NaN   \n",
+       "       2117-09-11 20:00:00              NaN              NaN   \n",
+       "       2117-09-11 21:00:00              NaN              NaN   \n",
+       "       2117-09-11 21:12:00              NaN              NaN   \n",
+       "       2117-09-11 21:16:00              NaN              NaN   \n",
+       "       2117-09-11 22:00:00              NaN            100.0   \n",
+       "       2117-09-11 22:10:00              NaN              NaN   \n",
+       "       2117-09-11 22:25:00              NaN              NaN   \n",
+       "...                                     ...              ...   \n",
+       "199999 2136-04-09 09:00:00             25.0              NaN   \n",
+       "       2136-04-09 10:00:00             24.0              NaN   \n",
+       "       2136-04-09 11:00:00             16.0              NaN   \n",
+       "       2136-04-09 12:00:00             24.0             98.3   \n",
+       "       2136-04-09 13:00:00             22.0              NaN   \n",
+       "       2136-04-09 14:00:00             28.0              NaN   \n",
+       "       2136-04-09 15:00:00             26.0              NaN   \n",
+       "       2136-04-09 16:00:00             27.0             98.0   \n",
+       "       2136-04-09 17:00:00             24.0              NaN   \n",
+       "       2136-04-09 18:00:00             24.0              NaN   \n",
+       "       2136-04-09 19:00:00             26.0              NaN   \n",
+       "       2136-04-09 20:00:00             23.0             97.4   \n",
+       "       2136-04-09 21:00:00             29.0              NaN   \n",
+       "       2136-04-09 22:00:00             25.0              NaN   \n",
+       "       2136-04-09 23:00:00             24.0              NaN   \n",
+       "       2136-04-10 00:00:00             25.0             97.4   \n",
+       "       2136-04-10 00:01:00              NaN              NaN   \n",
+       "       2136-04-10 01:00:00             26.0              NaN   \n",
+       "       2136-04-10 02:00:00             26.0              NaN   \n",
+       "       2136-04-10 02:28:00              NaN              NaN   \n",
+       "       2136-04-10 03:00:00             27.0             97.4   \n",
+       "       2136-04-10 04:00:00             26.0              NaN   \n",
+       "       2136-04-10 05:00:00             27.0              NaN   \n",
+       "       2136-04-10 06:00:00             19.0              NaN   \n",
+       "       2136-04-10 07:00:00             28.0              NaN   \n",
+       "       2136-04-10 08:00:00             24.0             98.1   \n",
+       "       2136-04-10 09:00:00             24.0              NaN   \n",
+       "       2136-04-10 09:10:00              NaN              NaN   \n",
+       "       2136-04-10 10:00:00             26.0              NaN   \n",
+       "       2136-04-10 11:00:00             24.0              NaN   \n",
+       "\n",
+       "label                      oxygen saturation pulse oximetry weight body  \\\n",
+       "status                                                known       known   \n",
+       "variable_type                                            qn          qn   \n",
+       "units                                               percent          kg   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00                              NaN         NaN   \n",
+       "       2117-09-11 09:32:00                              NaN         NaN   \n",
+       "       2117-09-11 12:50:00                              NaN         NaN   \n",
+       "       2117-09-11 12:55:00                              NaN         NaN   \n",
+       "       2117-09-11 12:57:00                              NaN         NaN   \n",
+       "       2117-09-11 13:00:00                              NaN         NaN   \n",
+       "       2117-09-11 13:01:00                              NaN         NaN   \n",
+       "       2117-09-11 13:48:00                              NaN         NaN   \n",
+       "       2117-09-11 13:49:00                              NaN         NaN   \n",
+       "       2117-09-11 13:50:00                              NaN         NaN   \n",
+       "       2117-09-11 14:00:00                              NaN         NaN   \n",
+       "       2117-09-11 15:00:00                              NaN         NaN   \n",
+       "       2117-09-11 15:48:00                              NaN         NaN   \n",
+       "       2117-09-11 15:59:00                              NaN         NaN   \n",
+       "       2117-09-11 16:00:00                              NaN         NaN   \n",
+       "       2117-09-11 16:02:00                            100.0         NaN   \n",
+       "       2117-09-11 16:11:00                              NaN         NaN   \n",
+       "       2117-09-11 16:12:00                              NaN         NaN   \n",
+       "       2117-09-11 17:00:00                             97.0         NaN   \n",
+       "       2117-09-11 18:00:00                             98.0         NaN   \n",
+       "       2117-09-11 18:34:00                              NaN         NaN   \n",
+       "       2117-09-11 19:00:00                              NaN         NaN   \n",
+       "       2117-09-11 19:31:00                              NaN         NaN   \n",
+       "       2117-09-11 20:00:00                             97.0         NaN   \n",
+       "       2117-09-11 21:00:00                              NaN         NaN   \n",
+       "       2117-09-11 21:12:00                              NaN         NaN   \n",
+       "       2117-09-11 21:16:00                              NaN         NaN   \n",
+       "       2117-09-11 22:00:00                              NaN         NaN   \n",
+       "       2117-09-11 22:10:00                             97.0         NaN   \n",
+       "       2117-09-11 22:25:00                              NaN         NaN   \n",
+       "...                                                     ...         ...   \n",
+       "199999 2136-04-09 09:00:00                             95.0         NaN   \n",
+       "       2136-04-09 10:00:00                             94.0         NaN   \n",
+       "       2136-04-09 11:00:00                             94.0         NaN   \n",
+       "       2136-04-09 12:00:00                             93.0         NaN   \n",
+       "       2136-04-09 13:00:00                             94.0         NaN   \n",
+       "       2136-04-09 14:00:00                             93.0         NaN   \n",
+       "       2136-04-09 15:00:00                             93.0         NaN   \n",
+       "       2136-04-09 16:00:00                             94.0         NaN   \n",
+       "       2136-04-09 17:00:00                             94.0         NaN   \n",
+       "       2136-04-09 18:00:00                             93.0         NaN   \n",
+       "       2136-04-09 19:00:00                             93.0         NaN   \n",
+       "       2136-04-09 20:00:00                             95.0         NaN   \n",
+       "       2136-04-09 21:00:00                             93.0         NaN   \n",
+       "       2136-04-09 22:00:00                             97.0         NaN   \n",
+       "       2136-04-09 23:00:00                             96.0         NaN   \n",
+       "       2136-04-10 00:00:00                             94.0         NaN   \n",
+       "       2136-04-10 00:01:00                              NaN         NaN   \n",
+       "       2136-04-10 01:00:00                             95.0         NaN   \n",
+       "       2136-04-10 02:00:00                             93.0         NaN   \n",
+       "       2136-04-10 02:28:00                              NaN         NaN   \n",
+       "       2136-04-10 03:00:00                             91.0         NaN   \n",
+       "       2136-04-10 04:00:00                             95.0         NaN   \n",
+       "       2136-04-10 05:00:00                             96.0         NaN   \n",
+       "       2136-04-10 06:00:00                             92.0         NaN   \n",
+       "       2136-04-10 07:00:00                             92.0         NaN   \n",
+       "       2136-04-10 08:00:00                             96.0         NaN   \n",
+       "       2136-04-10 09:00:00                             93.0         NaN   \n",
+       "       2136-04-10 09:10:00                              NaN         NaN   \n",
+       "       2136-04-10 10:00:00                             97.0         NaN   \n",
+       "       2136-04-10 11:00:00                             96.0         NaN   \n",
+       "\n",
+       "label                      output urine glasgow coma scale motor   ...    \\\n",
+       "status                            known                    known   ...     \n",
+       "variable_type                        qn                      ord   ...     \n",
+       "units                                mL                 no_units   ...     \n",
+       "id     datetime                                                    ...     \n",
+       "100001 2117-09-11 09:22:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 09:32:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:50:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:55:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 12:57:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:01:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:48:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 13:49:00        300.0                      NaN   ...     \n",
+       "       2117-09-11 13:50:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 14:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 15:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 15:48:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 15:59:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 16:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 16:02:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 16:11:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 16:12:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 17:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 18:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 18:34:00        400.0                      NaN   ...     \n",
+       "       2117-09-11 19:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 19:31:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 20:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 21:00:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 21:12:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 21:16:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 22:00:00        200.0                      NaN   ...     \n",
+       "       2117-09-11 22:10:00          NaN                      NaN   ...     \n",
+       "       2117-09-11 22:25:00          NaN                      NaN   ...     \n",
+       "...                                 ...                      ...   ...     \n",
+       "199999 2136-04-09 09:00:00        350.0                      NaN   ...     \n",
+       "       2136-04-09 10:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 11:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 12:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 13:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 14:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 15:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 16:00:00        400.0                      NaN   ...     \n",
+       "       2136-04-09 17:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 18:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 19:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 20:00:00        480.0                      NaN   ...     \n",
+       "       2136-04-09 21:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 22:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-09 23:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 00:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 00:01:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 01:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 02:00:00        350.0                      NaN   ...     \n",
+       "       2136-04-10 02:28:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 03:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 04:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 05:00:00        330.0                      NaN   ...     \n",
+       "       2136-04-10 06:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 07:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 08:00:00        200.0                      NaN   ...     \n",
+       "       2136-04-10 09:00:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 09:10:00          NaN                      NaN   ...     \n",
+       "       2136-04-10 10:00:00        200.0                      NaN   ...     \n",
+       "       2136-04-10 11:00:00          NaN                      NaN   ...     \n",
+       "\n",
+       "label                      normal saline             lactated ringers        \\\n",
+       "status                             known                        known         \n",
+       "variable_type                         qn                           qn         \n",
+       "units                                 mL       mL/hr               mL mL/hr   \n",
+       "id     datetime                                                               \n",
+       "100001 2117-09-11 09:22:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 09:32:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 12:50:00           NaN    5.000000              NaN   NaN   \n",
+       "       2117-09-11 12:55:00           NaN    6.996487              NaN   NaN   \n",
+       "       2117-09-11 12:57:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:01:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:48:00           NaN  499.999980              NaN   NaN   \n",
+       "       2117-09-11 13:49:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 13:50:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 14:00:00           NaN    8.990600              NaN   NaN   \n",
+       "       2117-09-11 15:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 15:48:00           NaN  999.999960              NaN   NaN   \n",
+       "       2117-09-11 15:59:00           NaN  199.999998              NaN   NaN   \n",
+       "       2117-09-11 16:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 16:02:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 16:11:00           NaN   40.000000              NaN   NaN   \n",
+       "       2117-09-11 16:12:00           NaN    4.992476              NaN   NaN   \n",
+       "       2117-09-11 17:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 18:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 18:34:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 19:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 19:31:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 20:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 21:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 21:12:00           NaN    3.396080              NaN   NaN   \n",
+       "       2117-09-11 21:16:00           NaN    5.012718              NaN   NaN   \n",
+       "       2117-09-11 22:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 22:10:00           NaN         NaN              NaN   NaN   \n",
+       "       2117-09-11 22:25:00         500.0         NaN              NaN   NaN   \n",
+       "...                                  ...         ...              ...   ...   \n",
+       "199999 2136-04-09 09:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 10:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 11:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 12:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 13:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 14:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 15:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 16:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 17:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 18:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 19:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 20:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 21:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 22:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-09 23:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 00:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 00:01:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 01:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 02:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 02:28:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 03:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 04:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 05:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 06:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 07:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 08:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 09:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 09:10:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 10:00:00           NaN         NaN              NaN   NaN   \n",
+       "       2136-04-10 11:00:00           NaN         NaN              NaN   NaN   \n",
+       "\n",
+       "label                      norepinephrine         vasopressin            \\\n",
+       "status                              known               known             \n",
+       "variable_type                          qn                  qn             \n",
+       "units                          mcg/kg/min mcg/min       units units/min   \n",
+       "id     datetime                                                           \n",
+       "100001 2117-09-11 09:22:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 09:32:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:50:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:55:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 12:57:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:01:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:48:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:49:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 13:50:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 14:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 15:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 15:48:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 15:59:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 16:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 16:02:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 16:11:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 16:12:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 17:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 18:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 18:34:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 19:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 19:31:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 20:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 21:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 21:12:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 21:16:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 22:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 22:10:00            NaN     NaN         NaN       NaN   \n",
+       "       2117-09-11 22:25:00            NaN     NaN         NaN       NaN   \n",
+       "...                                   ...     ...         ...       ...   \n",
+       "199999 2136-04-09 09:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 10:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 11:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 12:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 13:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 14:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 15:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 16:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 17:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 18:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 19:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 20:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 21:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 22:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-09 23:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 00:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 00:01:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 01:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 02:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 02:28:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 03:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 04:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 05:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 06:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 07:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 08:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 09:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 09:10:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 10:00:00            NaN     NaN         NaN       NaN   \n",
+       "       2136-04-10 11:00:00            NaN     NaN         NaN       NaN   \n",
+       "\n",
+       "label                      hemoglobin lactate  \n",
+       "status                          known   known  \n",
+       "variable_type                      qn      qn  \n",
+       "units                            g/dL  mmol/L  \n",
+       "id     datetime                                \n",
+       "100001 2117-09-11 09:22:00       13.0     NaN  \n",
+       "       2117-09-11 09:32:00        NaN     1.9  \n",
+       "       2117-09-11 12:50:00        NaN     NaN  \n",
+       "       2117-09-11 12:55:00        NaN     NaN  \n",
+       "       2117-09-11 12:57:00        NaN     NaN  \n",
+       "       2117-09-11 13:00:00        NaN     NaN  \n",
+       "       2117-09-11 13:01:00        NaN     NaN  \n",
+       "       2117-09-11 13:48:00        NaN     NaN  \n",
+       "       2117-09-11 13:49:00        NaN     NaN  \n",
+       "       2117-09-11 13:50:00        NaN     NaN  \n",
+       "       2117-09-11 14:00:00        NaN     NaN  \n",
+       "       2117-09-11 15:00:00        NaN     NaN  \n",
+       "       2117-09-11 15:48:00        NaN     NaN  \n",
+       "       2117-09-11 15:59:00        NaN     NaN  \n",
+       "       2117-09-11 16:00:00        NaN     NaN  \n",
+       "       2117-09-11 16:02:00        NaN     NaN  \n",
+       "       2117-09-11 16:11:00        NaN     NaN  \n",
+       "       2117-09-11 16:12:00        NaN     NaN  \n",
+       "       2117-09-11 17:00:00        NaN     NaN  \n",
+       "       2117-09-11 18:00:00        NaN     NaN  \n",
+       "       2117-09-11 18:34:00        NaN     NaN  \n",
+       "       2117-09-11 19:00:00        NaN     NaN  \n",
+       "       2117-09-11 19:31:00       11.0     NaN  \n",
+       "       2117-09-11 20:00:00        NaN     NaN  \n",
+       "       2117-09-11 21:00:00        NaN     NaN  \n",
+       "       2117-09-11 21:12:00        NaN     NaN  \n",
+       "       2117-09-11 21:16:00        NaN     NaN  \n",
+       "       2117-09-11 22:00:00        NaN     NaN  \n",
+       "       2117-09-11 22:10:00        NaN     NaN  \n",
+       "       2117-09-11 22:25:00        NaN     NaN  \n",
+       "...                               ...     ...  \n",
+       "199999 2136-04-09 09:00:00        NaN     NaN  \n",
+       "       2136-04-09 10:00:00        NaN     NaN  \n",
+       "       2136-04-09 11:00:00        NaN     NaN  \n",
+       "       2136-04-09 12:00:00        NaN     NaN  \n",
+       "       2136-04-09 13:00:00        NaN     NaN  \n",
+       "       2136-04-09 14:00:00        NaN     NaN  \n",
+       "       2136-04-09 15:00:00        NaN     NaN  \n",
+       "       2136-04-09 16:00:00        NaN     NaN  \n",
+       "       2136-04-09 17:00:00        NaN     NaN  \n",
+       "       2136-04-09 18:00:00        NaN     NaN  \n",
+       "       2136-04-09 19:00:00        NaN     NaN  \n",
+       "       2136-04-09 20:00:00        NaN     NaN  \n",
+       "       2136-04-09 21:00:00        NaN     NaN  \n",
+       "       2136-04-09 22:00:00        NaN     NaN  \n",
+       "       2136-04-09 23:00:00        NaN     NaN  \n",
+       "       2136-04-10 00:00:00        NaN     NaN  \n",
+       "       2136-04-10 00:01:00        NaN     NaN  \n",
+       "       2136-04-10 01:00:00        NaN     NaN  \n",
+       "       2136-04-10 02:00:00        NaN     NaN  \n",
+       "       2136-04-10 02:28:00       12.6     NaN  \n",
+       "       2136-04-10 03:00:00        NaN     NaN  \n",
+       "       2136-04-10 04:00:00        NaN     NaN  \n",
+       "       2136-04-10 05:00:00        NaN     NaN  \n",
+       "       2136-04-10 06:00:00        NaN     NaN  \n",
+       "       2136-04-10 07:00:00        NaN     NaN  \n",
+       "       2136-04-10 08:00:00        NaN     NaN  \n",
+       "       2136-04-10 09:00:00        NaN     NaN  \n",
+       "       2136-04-10 09:10:00        NaN     NaN  \n",
+       "       2136-04-10 10:00:00        NaN     NaN  \n",
+       "       2136-04-10 11:00:00        NaN     NaN  \n",
+       "\n",
+       "[10071464 rows x 22 columns]"
+      ]
+     },
+     "execution_count": 15,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "utils.save_df(df_final,hdf5_fname,'cleaned/test1')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Prepare for ML\n",
+    "\n",
+    "\n",
+    "1. Convert all categorical variables to numeric representations\n",
+    "2. Segment the data and add the segments to the index\n",
+    "3. Transform the data into features (FeatureUnion)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Combine mimic_transform and standard_pipeline into one Pipeline; the steps are\n",
+    "# named 'transform' and 'format' and are listed in that order.\n",
+    "intro_pipeline = Pipeline([('transform', mimic_transform), ('format', standard_pipeline)])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">mmol/L</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>50813</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>50813(mmol/L)</th>\n",
+       "      <th>818(mmol/L)</th>\n",
+       "      <th>1531(mmol/L)</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>100001</th>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100003</th>\n",
+       "      <th>2150-04-17 19:12:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-08 10:58:00</th>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-03-31 00:44:00</th>\n",
+       "      <td>3.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-02 14:10:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      lactate                                          \\\n",
+       "status                       known                   unknown                 \n",
+       "variable_type                   qn                        qn           nom   \n",
+       "units                       mmol/L                  no_units      no_units   \n",
+       "description                  50813 225668  818 1531   225668 50813(mmol/L)   \n",
+       "id     datetime                                                              \n",
+       "100001 2117-09-11 09:32:00     1.9    NaN  NaN  NaN      NaN           NaN   \n",
+       "100003 2150-04-17 19:12:00     1.1    1.1  NaN  NaN      NaN           NaN   \n",
+       "100006 2108-04-08 10:58:00     4.5    NaN  4.5  NaN      NaN           NaN   \n",
+       "100007 2145-03-31 00:44:00     3.1    NaN  NaN  NaN      NaN           NaN   \n",
+       "       2145-04-02 14:10:00     1.9    NaN  NaN  NaN      NaN           NaN   \n",
+       "\n",
+       "label                                                \n",
+       "status                                               \n",
+       "variable_type                                        \n",
+       "units                                                \n",
+       "description                818(mmol/L) 1531(mmol/L)  \n",
+       "id     datetime                                      \n",
+       "100001 2117-09-11 09:32:00         NaN          NaN  \n",
+       "100003 2150-04-17 19:12:00         NaN          NaN  \n",
+       "100006 2108-04-08 10:58:00         NaN          NaN  \n",
+       "100007 2145-03-31 00:44:00         NaN          NaN  \n",
+       "       2145-04-02 14:10:00         NaN          NaN  "
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Open the stored extract for a single label, run it through intro_pipeline,\n",
+    "# and preview the first rows of the transformed frame.\n",
+    "label = 'lactate'\n",
+    "df_extract = utils.open_df(hdf5_fname, 'extract/' + label)\n",
+    "df_cleaned = intro_pipeline.transform(df_extract)\n",
+    "df_cleaned.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">mmol/L</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>50813</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>50813(mmol/L)</th>\n",
+       "      <th>818(mmol/L)</th>\n",
+       "      <th>1531(mmol/L)</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>176767.000000</td>\n",
+       "      <td>69402.000000</td>\n",
+       "      <td>72916.000000</td>\n",
+       "      <td>63134.000000</td>\n",
+       "      <td>14.000000</td>\n",
+       "      <td>57</td>\n",
+       "      <td>57</td>\n",
+       "      <td>23</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34</td>\n",
+       "      <td>14</td>\n",
+       "      <td>8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>ERROR</td>\n",
+       "      <td>no data</td>\n",
+       "      <td>no data</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>18</td>\n",
+       "      <td>37</td>\n",
+       "      <td>9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>2.635120</td>\n",
+       "      <td>16.943607</td>\n",
+       "      <td>2.849300</td>\n",
+       "      <td>2.780338</td>\n",
+       "      <td>52.835714</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2.590268</td>\n",
+       "      <td>3795.881233</td>\n",
+       "      <td>3.152031</td>\n",
+       "      <td>3.045527</td>\n",
+       "      <td>82.567153</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.050000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>1.200000</td>\n",
+       "      <td>1.200000</td>\n",
+       "      <td>1.200000</td>\n",
+       "      <td>1.200000</td>\n",
+       "      <td>1.175000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>1.800000</td>\n",
+       "      <td>1.800000</td>\n",
+       "      <td>1.800000</td>\n",
+       "      <td>1.800000</td>\n",
+       "      <td>3.400000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>2.900000</td>\n",
+       "      <td>2.900000</td>\n",
+       "      <td>3.100000</td>\n",
+       "      <td>3.000000</td>\n",
+       "      <td>115.400000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>36.000000</td>\n",
+       "      <td>999999.000000</td>\n",
+       "      <td>153.000000</td>\n",
+       "      <td>153.000000</td>\n",
+       "      <td>203.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                lactate                                             \\\n",
+       "status                 known                                              \n",
+       "variable_type             qn                                              \n",
+       "units                 mmol/L                                              \n",
+       "description            50813         225668           818          1531   \n",
+       "count          176767.000000   69402.000000  72916.000000  63134.000000   \n",
+       "unique                   NaN            NaN           NaN           NaN   \n",
+       "top                      NaN            NaN           NaN           NaN   \n",
+       "freq                     NaN            NaN           NaN           NaN   \n",
+       "mean                2.635120      16.943607      2.849300      2.780338   \n",
+       "std                 2.590268    3795.881233      3.152031      3.045527   \n",
+       "min                 0.000000       0.050000      0.000000      0.000000   \n",
+       "25%                 1.200000       1.200000      1.200000      1.200000   \n",
+       "50%                 1.800000       1.800000      1.800000      1.800000   \n",
+       "75%                 2.900000       2.900000      3.100000      3.000000   \n",
+       "max                36.000000  999999.000000    153.000000    153.000000   \n",
+       "\n",
+       "label                                                             \n",
+       "status            unknown                                         \n",
+       "variable_type          qn           nom                           \n",
+       "units            no_units      no_units                           \n",
+       "description        225668 50813(mmol/L) 818(mmol/L) 1531(mmol/L)  \n",
+       "count           14.000000            57          57           23  \n",
+       "unique                NaN            34          14            8  \n",
+       "top                   NaN         ERROR     no data      no data  \n",
+       "freq                  NaN            18          37            9  \n",
+       "mean            52.835714           NaN         NaN          NaN  \n",
+       "std             82.567153           NaN         NaN          NaN  \n",
+       "min              0.000000           NaN         NaN          NaN  \n",
+       "25%              1.175000           NaN         NaN          NaN  \n",
+       "50%              3.400000           NaN         NaN          NaN  \n",
+       "75%            115.400000           NaN         NaN          NaN  \n",
+       "max            203.000000           NaN         NaN          NaN  "
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_cleaned.describe(include='all')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 28,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"21\" halign=\"left\">lactate</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"17\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "      <th>qn</th>\n",
+       "      <th colspan=\"16\" halign=\"left\">nom</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">mmol/L</th>\n",
+       "      <th>no_units</th>\n",
+       "      <th colspan=\"16\" halign=\"left\">no_units</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>50813</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>818</th>\n",
+       "      <th>1531</th>\n",
+       "      <th>225668</th>\n",
+       "      <th>50813(mmol/L)_.</th>\n",
+       "      <th>50813(mmol/L)_5,0</th>\n",
+       "      <th>50813(mmol/L)_&gt;30</th>\n",
+       "      <th>50813(mmol/L)_&gt;30.0</th>\n",
+       "      <th>50813(mmol/L)_CLOTTED</th>\n",
+       "      <th>...</th>\n",
+       "      <th>818(mmol/L)_VOIDED</th>\n",
+       "      <th>818(mmol/L)_no data</th>\n",
+       "      <th>1531(mmol/L)_.</th>\n",
+       "      <th>1531(mmol/L)_5,0</th>\n",
+       "      <th>1531(mmol/L)_&gt;30</th>\n",
+       "      <th>1531(mmol/L)_&gt;30.0</th>\n",
+       "      <th>1531(mmol/L)_CLOTTED</th>\n",
+       "      <th>1531(mmol/L)_ERROR</th>\n",
+       "      <th>1531(mmol/L)_VOIDED</th>\n",
+       "      <th>1531(mmol/L)_no data</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>100001</th>\n",
+       "      <th>2117-09-11 09:32:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100003</th>\n",
+       "      <th>2150-04-17 19:12:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-08 10:58:00</th>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-03-31 00:44:00</th>\n",
+       "      <td>3.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-02 14:10:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100009</th>\n",
+       "      <th>2162-05-17 13:19:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2162-05-17 17:14:00</th>\n",
+       "      <td>1.5</td>\n",
+       "      <td>1.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">100010</th>\n",
+       "      <th>2109-12-10 10:25:00</th>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 12:11:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:05:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-10 13:58:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100011</th>\n",
+       "      <th>2177-08-29 04:44:00</th>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-08-29 06:55:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100012</th>\n",
+       "      <th>2177-03-14 07:38:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-14 11:42:00</th>\n",
+       "      <td>2.5</td>\n",
+       "      <td>2.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 08:05:00</th>\n",
+       "      <td>2.1</td>\n",
+       "      <td>2.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 14:01:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-03-15 21:42:00</th>\n",
+       "      <td>1.8</td>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100016</th>\n",
+       "      <th>2188-05-24 12:00:00</th>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100017</th>\n",
+       "      <th>2103-03-11 05:10:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">100018</th>\n",
+       "      <th>2176-08-29 15:29:00</th>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 09:23:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 10:19:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 11:29:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2176-08-30 12:40:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100020</th>\n",
+       "      <th>2142-11-30 21:54:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2142-12-03 00:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100024</th>\n",
+       "      <th>2170-09-19 10:25:00</th>\n",
+       "      <td>1.4</td>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-19 16:33:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2170-09-20 02:04:00</th>\n",
+       "      <td>3.2</td>\n",
+       "      <td>3.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199976</th>\n",
+       "      <th>2182-02-14 11:15:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-16 03:57:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-19 03:59:00</th>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-20 03:31:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-21 04:55:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199979</th>\n",
+       "      <th>2182-02-06 09:17:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2182-02-06 14:16:00</th>\n",
+       "      <td>3.8</td>\n",
+       "      <td>3.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">199981</th>\n",
+       "      <th>2110-09-24 16:34:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-24 20:09:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2110-09-25 06:10:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>199987</th>\n",
+       "      <th>2175-05-19 16:30:00</th>\n",
+       "      <td>2.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">199988</th>\n",
+       "      <th>2169-01-24 12:48:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 01:35:00</th>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 11:18:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 16:43:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-07 22:35:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2169-02-10 05:33:00</th>\n",
+       "      <td>1.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199993</th>\n",
+       "      <th>2161-11-12 23:14:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-11-13 03:46:00</th>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"4\" valign=\"top\">199994</th>\n",
+       "      <th>2188-07-07 21:23:00</th>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 03:09:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 04:13:00</th>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2188-07-08 06:20:00</th>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-20 10:52:00</th>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>1.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 12:36:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:33:00</th>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 13:59:00</th>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>2.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 20:43:00</th>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>1.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-04 20:55:00</th>\n",
+       "      <td>1.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 15:29:00</th>\n",
+       "      <td>1.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>...</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "      <td>0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>177450 rows × 29 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      lactate                                            \\\n",
+       "status                       known                   unknown                   \n",
+       "variable_type                   qn                        qn             nom   \n",
+       "units                       mmol/L                  no_units        no_units   \n",
+       "description                  50813 225668  818 1531   225668 50813(mmol/L)_.   \n",
+       "id     datetime                                                                \n",
+       "100001 2117-09-11 09:32:00     1.9    NaN  NaN  NaN      NaN               0   \n",
+       "100003 2150-04-17 19:12:00     1.1    1.1  NaN  NaN      NaN               0   \n",
+       "100006 2108-04-08 10:58:00     4.5    NaN  4.5  NaN      NaN               0   \n",
+       "100007 2145-03-31 00:44:00     3.1    NaN  NaN  NaN      NaN               0   \n",
+       "       2145-04-02 14:10:00     1.9    NaN  NaN  NaN      NaN               0   \n",
+       "100009 2162-05-17 13:19:00     1.1    1.1  NaN  NaN      NaN               0   \n",
+       "       2162-05-17 17:14:00     1.5    1.5  NaN  NaN      NaN               0   \n",
+       "100010 2109-12-10 10:25:00     0.6    NaN  NaN  NaN      NaN               0   \n",
+       "       2109-12-10 12:11:00     0.9    NaN  NaN  NaN      NaN               0   \n",
+       "       2109-12-10 13:05:00     1.0    NaN  NaN  NaN      NaN               0   \n",
+       "       2109-12-10 13:58:00     0.8    NaN  NaN  NaN      NaN               0   \n",
+       "100011 2177-08-29 04:44:00     3.8    NaN  NaN  NaN      NaN               0   \n",
+       "       2177-08-29 06:55:00     2.3    2.3  NaN  NaN      NaN               0   \n",
+       "100012 2177-03-14 07:38:00     2.3    NaN  NaN  NaN      NaN               0   \n",
+       "       2177-03-14 11:42:00     2.5    2.5  NaN  NaN      NaN               0   \n",
+       "       2177-03-15 08:05:00     2.1    2.1  NaN  NaN      NaN               0   \n",
+       "       2177-03-15 14:01:00     2.6    2.6  NaN  NaN      NaN               0   \n",
+       "       2177-03-15 21:42:00     1.8    1.8  NaN  NaN      NaN               0   \n",
+       "100016 2188-05-24 12:00:00     2.0    NaN  NaN  NaN      NaN               0   \n",
+       "100017 2103-03-11 05:10:00     1.1    NaN  1.1  NaN      NaN               0   \n",
+       "100018 2176-08-29 15:29:00     1.3    NaN  NaN  NaN      NaN               0   \n",
+       "       2176-08-30 09:23:00     0.9    0.9  NaN  NaN      NaN               0   \n",
+       "       2176-08-30 10:19:00     1.0    1.0  NaN  NaN      NaN               0   \n",
+       "       2176-08-30 11:29:00     0.9    0.9  NaN  NaN      NaN               0   \n",
+       "       2176-08-30 12:40:00     1.1    1.1  NaN  NaN      NaN               0   \n",
+       "100020 2142-11-30 21:54:00     1.1    NaN  NaN  NaN      NaN               0   \n",
+       "       2142-12-03 00:17:00     1.0    NaN  NaN  NaN      NaN               0   \n",
+       "100024 2170-09-19 10:25:00     1.4    1.4  NaN  NaN      NaN               0   \n",
+       "       2170-09-19 16:33:00     2.6    2.6  NaN  NaN      NaN               0   \n",
+       "       2170-09-20 02:04:00     3.2    3.2  NaN  NaN      NaN               0   \n",
+       "...                            ...    ...  ...  ...      ...             ...   \n",
+       "199976 2182-02-14 11:15:00     0.8    NaN  0.8  NaN      NaN               0   \n",
+       "       2182-02-16 03:57:00     0.8    NaN  0.8  NaN      NaN               0   \n",
+       "       2182-02-19 03:59:00     0.8    NaN  0.8  NaN      NaN               0   \n",
+       "       2182-02-20 03:31:00     0.7    NaN  0.7  NaN      NaN               0   \n",
+       "       2182-02-21 04:55:00     0.9    NaN  0.9  NaN      NaN               0   \n",
+       "199979 2182-02-06 09:17:00     1.0    NaN  NaN  NaN      NaN               0   \n",
+       "       2182-02-06 14:16:00     3.8    3.8  NaN  NaN      NaN               0   \n",
+       "199981 2110-09-24 16:34:00     1.1    NaN  1.1  1.1      NaN               0   \n",
+       "       2110-09-24 20:09:00     1.0    NaN  1.0  1.0      NaN               0   \n",
+       "       2110-09-25 06:10:00     1.0    NaN  1.0  1.0      NaN               0   \n",
+       "199987 2175-05-19 16:30:00     2.3    NaN  NaN  NaN      NaN               0   \n",
+       "199988 2169-01-24 12:48:00     1.0    NaN  NaN  NaN      NaN               0   \n",
+       "       2169-02-07 01:35:00     1.6    NaN  1.6  NaN      NaN               0   \n",
+       "       2169-02-07 11:18:00     1.0    NaN  1.0  NaN      NaN               0   \n",
+       "       2169-02-07 16:43:00     1.0    NaN  1.0  NaN      NaN               0   \n",
+       "       2169-02-07 22:35:00     1.1    NaN  1.1  NaN      NaN               0   \n",
+       "       2169-02-10 05:33:00     1.4    NaN  NaN  NaN      NaN               0   \n",
+       "199993 2161-11-12 23:14:00     0.9    NaN  0.9  NaN      NaN               0   \n",
+       "       2161-11-13 03:46:00     0.9    NaN  0.9  NaN      NaN               0   \n",
+       "199994 2188-07-07 21:23:00     1.0    NaN  1.0  NaN      NaN               0   \n",
+       "       2188-07-08 03:09:00     0.7    NaN  0.7  NaN      NaN               0   \n",
+       "       2188-07-08 04:13:00     0.6    NaN  0.6  NaN      NaN               0   \n",
+       "       2188-07-08 06:20:00     0.7    NaN  0.7  NaN      NaN               0   \n",
+       "199998 2119-02-20 10:52:00     1.1    1.1  1.1  1.1      NaN               0   \n",
+       "       2119-02-20 12:36:00     1.9    1.9  1.9  1.9      NaN               0   \n",
+       "       2119-02-20 13:33:00     2.0    2.0  2.0  2.0      NaN               0   \n",
+       "       2119-02-20 13:59:00     2.6    2.6  2.6  2.6      NaN               0   \n",
+       "       2119-02-20 20:43:00     1.3    1.3  1.3  1.3      NaN               0   \n",
+       "199999 2136-04-04 20:55:00     1.9    NaN  NaN  NaN      NaN               0   \n",
+       "       2136-04-06 15:29:00     1.8    NaN  NaN  NaN      NaN               0   \n",
+       "\n",
+       "label                                                           \\\n",
+       "status                                                           \n",
+       "variable_type                                                    \n",
+       "units                                                            \n",
+       "description                50813(mmol/L)_5,0 50813(mmol/L)_>30   \n",
+       "id     datetime                                                  \n",
+       "100001 2117-09-11 09:32:00                 0                 0   \n",
+       "100003 2150-04-17 19:12:00                 0                 0   \n",
+       "100006 2108-04-08 10:58:00                 0                 0   \n",
+       "100007 2145-03-31 00:44:00                 0                 0   \n",
+       "       2145-04-02 14:10:00                 0                 0   \n",
+       "100009 2162-05-17 13:19:00                 0                 0   \n",
+       "       2162-05-17 17:14:00                 0                 0   \n",
+       "100010 2109-12-10 10:25:00                 0                 0   \n",
+       "       2109-12-10 12:11:00                 0                 0   \n",
+       "       2109-12-10 13:05:00                 0                 0   \n",
+       "       2109-12-10 13:58:00                 0                 0   \n",
+       "100011 2177-08-29 04:44:00                 0                 0   \n",
+       "       2177-08-29 06:55:00                 0                 0   \n",
+       "100012 2177-03-14 07:38:00                 0                 0   \n",
+       "       2177-03-14 11:42:00                 0                 0   \n",
+       "       2177-03-15 08:05:00                 0                 0   \n",
+       "       2177-03-15 14:01:00                 0                 0   \n",
+       "       2177-03-15 21:42:00                 0                 0   \n",
+       "100016 2188-05-24 12:00:00                 0                 0   \n",
+       "100017 2103-03-11 05:10:00                 0                 0   \n",
+       "100018 2176-08-29 15:29:00                 0                 0   \n",
+       "       2176-08-30 09:23:00                 0                 0   \n",
+       "       2176-08-30 10:19:00                 0                 0   \n",
+       "       2176-08-30 11:29:00                 0                 0   \n",
+       "       2176-08-30 12:40:00                 0                 0   \n",
+       "100020 2142-11-30 21:54:00                 0                 0   \n",
+       "       2142-12-03 00:17:00                 0                 0   \n",
+       "100024 2170-09-19 10:25:00                 0                 0   \n",
+       "       2170-09-19 16:33:00                 0                 0   \n",
+       "       2170-09-20 02:04:00                 0                 0   \n",
+       "...                                      ...               ...   \n",
+       "199976 2182-02-14 11:15:00                 0                 0   \n",
+       "       2182-02-16 03:57:00                 0                 0   \n",
+       "       2182-02-19 03:59:00                 0                 0   \n",
+       "       2182-02-20 03:31:00                 0                 0   \n",
+       "       2182-02-21 04:55:00                 0                 0   \n",
+       "199979 2182-02-06 09:17:00                 0                 0   \n",
+       "       2182-02-06 14:16:00                 0                 0   \n",
+       "199981 2110-09-24 16:34:00                 0                 0   \n",
+       "       2110-09-24 20:09:00                 0                 0   \n",
+       "       2110-09-25 06:10:00                 0                 0   \n",
+       "199987 2175-05-19 16:30:00                 0                 0   \n",
+       "199988 2169-01-24 12:48:00                 0                 0   \n",
+       "       2169-02-07 01:35:00                 0                 0   \n",
+       "       2169-02-07 11:18:00                 0                 0   \n",
+       "       2169-02-07 16:43:00                 0                 0   \n",
+       "       2169-02-07 22:35:00                 0                 0   \n",
+       "       2169-02-10 05:33:00                 0                 0   \n",
+       "199993 2161-11-12 23:14:00                 0                 0   \n",
+       "       2161-11-13 03:46:00                 0                 0   \n",
+       "199994 2188-07-07 21:23:00                 0                 0   \n",
+       "       2188-07-08 03:09:00                 0                 0   \n",
+       "       2188-07-08 04:13:00                 0                 0   \n",
+       "       2188-07-08 06:20:00                 0                 0   \n",
+       "199998 2119-02-20 10:52:00                 0                 0   \n",
+       "       2119-02-20 12:36:00                 0                 0   \n",
+       "       2119-02-20 13:33:00                 0                 0   \n",
+       "       2119-02-20 13:59:00                 0                 0   \n",
+       "       2119-02-20 20:43:00                 0                 0   \n",
+       "199999 2136-04-04 20:55:00                 0                 0   \n",
+       "       2136-04-06 15:29:00                 0                 0   \n",
+       "\n",
+       "label                                                                 \\\n",
+       "status                                                                 \n",
+       "variable_type                                                          \n",
+       "units                                                                  \n",
+       "description                50813(mmol/L)_>30.0 50813(mmol/L)_CLOTTED   \n",
+       "id     datetime                                                        \n",
+       "100001 2117-09-11 09:32:00                   0                     0   \n",
+       "100003 2150-04-17 19:12:00                   0                     0   \n",
+       "100006 2108-04-08 10:58:00                   0                     0   \n",
+       "100007 2145-03-31 00:44:00                   0                     0   \n",
+       "       2145-04-02 14:10:00                   0                     0   \n",
+       "100009 2162-05-17 13:19:00                   0                     0   \n",
+       "       2162-05-17 17:14:00                   0                     0   \n",
+       "100010 2109-12-10 10:25:00                   0                     0   \n",
+       "       2109-12-10 12:11:00                   0                     0   \n",
+       "       2109-12-10 13:05:00                   0                     0   \n",
+       "       2109-12-10 13:58:00                   0                     0   \n",
+       "100011 2177-08-29 04:44:00                   0                     0   \n",
+       "       2177-08-29 06:55:00                   0                     0   \n",
+       "100012 2177-03-14 07:38:00                   0                     0   \n",
+       "       2177-03-14 11:42:00                   0                     0   \n",
+       "       2177-03-15 08:05:00                   0                     0   \n",
+       "       2177-03-15 14:01:00                   0                     0   \n",
+       "       2177-03-15 21:42:00                   0                     0   \n",
+       "100016 2188-05-24 12:00:00                   0                     0   \n",
+       "100017 2103-03-11 05:10:00                   0                     0   \n",
+       "100018 2176-08-29 15:29:00                   0                     0   \n",
+       "       2176-08-30 09:23:00                   0                     0   \n",
+       "       2176-08-30 10:19:00                   0                     0   \n",
+       "       2176-08-30 11:29:00                   0                     0   \n",
+       "       2176-08-30 12:40:00                   0                     0   \n",
+       "100020 2142-11-30 21:54:00                   0                     0   \n",
+       "       2142-12-03 00:17:00                   0                     0   \n",
+       "100024 2170-09-19 10:25:00                   0                     0   \n",
+       "       2170-09-19 16:33:00                   0                     0   \n",
+       "       2170-09-20 02:04:00                   0                     0   \n",
+       "...                                        ...                   ...   \n",
+       "199976 2182-02-14 11:15:00                   0                     0   \n",
+       "       2182-02-16 03:57:00                   0                     0   \n",
+       "       2182-02-19 03:59:00                   0                     0   \n",
+       "       2182-02-20 03:31:00                   0                     0   \n",
+       "       2182-02-21 04:55:00                   0                     0   \n",
+       "199979 2182-02-06 09:17:00                   0                     0   \n",
+       "       2182-02-06 14:16:00                   0                     0   \n",
+       "199981 2110-09-24 16:34:00                   0                     0   \n",
+       "       2110-09-24 20:09:00                   0                     0   \n",
+       "       2110-09-25 06:10:00                   0                     0   \n",
+       "199987 2175-05-19 16:30:00                   0                     0   \n",
+       "199988 2169-01-24 12:48:00                   0                     0   \n",
+       "       2169-02-07 01:35:00                   0                     0   \n",
+       "       2169-02-07 11:18:00                   0                     0   \n",
+       "       2169-02-07 16:43:00                   0                     0   \n",
+       "       2169-02-07 22:35:00                   0                     0   \n",
+       "       2169-02-10 05:33:00                   0                     0   \n",
+       "199993 2161-11-12 23:14:00                   0                     0   \n",
+       "       2161-11-13 03:46:00                   0                     0   \n",
+       "199994 2188-07-07 21:23:00                   0                     0   \n",
+       "       2188-07-08 03:09:00                   0                     0   \n",
+       "       2188-07-08 04:13:00                   0                     0   \n",
+       "       2188-07-08 06:20:00                   0                     0   \n",
+       "199998 2119-02-20 10:52:00                   0                     0   \n",
+       "       2119-02-20 12:36:00                   0                     0   \n",
+       "       2119-02-20 13:33:00                   0                     0   \n",
+       "       2119-02-20 13:59:00                   0                     0   \n",
+       "       2119-02-20 20:43:00                   0                     0   \n",
+       "199999 2136-04-04 20:55:00                   0                     0   \n",
+       "       2136-04-06 15:29:00                   0                     0   \n",
+       "\n",
+       "label                              ...                              \\\n",
+       "status                             ...                               \n",
+       "variable_type                      ...                               \n",
+       "units                              ...                               \n",
+       "description                        ...          818(mmol/L)_VOIDED   \n",
+       "id     datetime                    ...                               \n",
+       "100001 2117-09-11 09:32:00         ...                           0   \n",
+       "100003 2150-04-17 19:12:00         ...                           0   \n",
+       "100006 2108-04-08 10:58:00         ...                           0   \n",
+       "100007 2145-03-31 00:44:00         ...                           0   \n",
+       "       2145-04-02 14:10:00         ...                           0   \n",
+       "100009 2162-05-17 13:19:00         ...                           0   \n",
+       "       2162-05-17 17:14:00         ...                           0   \n",
+       "100010 2109-12-10 10:25:00         ...                           0   \n",
+       "       2109-12-10 12:11:00         ...                           0   \n",
+       "       2109-12-10 13:05:00         ...                           0   \n",
+       "       2109-12-10 13:58:00         ...                           0   \n",
+       "100011 2177-08-29 04:44:00         ...                           0   \n",
+       "       2177-08-29 06:55:00         ...                           0   \n",
+       "100012 2177-03-14 07:38:00         ...                           0   \n",
+       "       2177-03-14 11:42:00         ...                           0   \n",
+       "       2177-03-15 08:05:00         ...                           0   \n",
+       "       2177-03-15 14:01:00         ...                           0   \n",
+       "       2177-03-15 21:42:00         ...                           0   \n",
+       "100016 2188-05-24 12:00:00         ...                           0   \n",
+       "100017 2103-03-11 05:10:00         ...                           0   \n",
+       "100018 2176-08-29 15:29:00         ...                           0   \n",
+       "       2176-08-30 09:23:00         ...                           0   \n",
+       "       2176-08-30 10:19:00         ...                           0   \n",
+       "       2176-08-30 11:29:00         ...                           0   \n",
+       "       2176-08-30 12:40:00         ...                           0   \n",
+       "100020 2142-11-30 21:54:00         ...                           0   \n",
+       "       2142-12-03 00:17:00         ...                           0   \n",
+       "100024 2170-09-19 10:25:00         ...                           0   \n",
+       "       2170-09-19 16:33:00         ...                           0   \n",
+       "       2170-09-20 02:04:00         ...                           0   \n",
+       "...                                ...                         ...   \n",
+       "199976 2182-02-14 11:15:00         ...                           0   \n",
+       "       2182-02-16 03:57:00         ...                           0   \n",
+       "       2182-02-19 03:59:00         ...                           0   \n",
+       "       2182-02-20 03:31:00         ...                           0   \n",
+       "       2182-02-21 04:55:00         ...                           0   \n",
+       "199979 2182-02-06 09:17:00         ...                           0   \n",
+       "       2182-02-06 14:16:00         ...                           0   \n",
+       "199981 2110-09-24 16:34:00         ...                           0   \n",
+       "       2110-09-24 20:09:00         ...                           0   \n",
+       "       2110-09-25 06:10:00         ...                           0   \n",
+       "199987 2175-05-19 16:30:00         ...                           0   \n",
+       "199988 2169-01-24 12:48:00         ...                           0   \n",
+       "       2169-02-07 01:35:00         ...                           0   \n",
+       "       2169-02-07 11:18:00         ...                           0   \n",
+       "       2169-02-07 16:43:00         ...                           0   \n",
+       "       2169-02-07 22:35:00         ...                           0   \n",
+       "       2169-02-10 05:33:00         ...                           0   \n",
+       "199993 2161-11-12 23:14:00         ...                           0   \n",
+       "       2161-11-13 03:46:00         ...                           0   \n",
+       "199994 2188-07-07 21:23:00         ...                           0   \n",
+       "       2188-07-08 03:09:00         ...                           0   \n",
+       "       2188-07-08 04:13:00         ...                           0   \n",
+       "       2188-07-08 06:20:00         ...                           0   \n",
+       "199998 2119-02-20 10:52:00         ...                           0   \n",
+       "       2119-02-20 12:36:00         ...                           0   \n",
+       "       2119-02-20 13:33:00         ...                           0   \n",
+       "       2119-02-20 13:59:00         ...                           0   \n",
+       "       2119-02-20 20:43:00         ...                           0   \n",
+       "199999 2136-04-04 20:55:00         ...                           0   \n",
+       "       2136-04-06 15:29:00         ...                           0   \n",
+       "\n",
+       "label                                                          \\\n",
+       "status                                                          \n",
+       "variable_type                                                   \n",
+       "units                                                           \n",
+       "description                818(mmol/L)_no data 1531(mmol/L)_.   \n",
+       "id     datetime                                                 \n",
+       "100001 2117-09-11 09:32:00                   0              0   \n",
+       "100003 2150-04-17 19:12:00                   0              0   \n",
+       "100006 2108-04-08 10:58:00                   0              0   \n",
+       "100007 2145-03-31 00:44:00                   0              0   \n",
+       "       2145-04-02 14:10:00                   0              0   \n",
+       "100009 2162-05-17 13:19:00                   0              0   \n",
+       "       2162-05-17 17:14:00                   0              0   \n",
+       "100010 2109-12-10 10:25:00                   0              0   \n",
+       "       2109-12-10 12:11:00                   0              0   \n",
+       "       2109-12-10 13:05:00                   0              0   \n",
+       "       2109-12-10 13:58:00                   0              0   \n",
+       "100011 2177-08-29 04:44:00                   0              0   \n",
+       "       2177-08-29 06:55:00                   0              0   \n",
+       "100012 2177-03-14 07:38:00                   0              0   \n",
+       "       2177-03-14 11:42:00                   0              0   \n",
+       "       2177-03-15 08:05:00                   0              0   \n",
+       "       2177-03-15 14:01:00                   0              0   \n",
+       "       2177-03-15 21:42:00                   0              0   \n",
+       "100016 2188-05-24 12:00:00                   0              0   \n",
+       "100017 2103-03-11 05:10:00                   0              0   \n",
+       "100018 2176-08-29 15:29:00                   0              0   \n",
+       "       2176-08-30 09:23:00                   0              0   \n",
+       "       2176-08-30 10:19:00                   0              0   \n",
+       "       2176-08-30 11:29:00                   0              0   \n",
+       "       2176-08-30 12:40:00                   0              0   \n",
+       "100020 2142-11-30 21:54:00                   0              0   \n",
+       "       2142-12-03 00:17:00                   0              0   \n",
+       "100024 2170-09-19 10:25:00                   0              0   \n",
+       "       2170-09-19 16:33:00                   0              0   \n",
+       "       2170-09-20 02:04:00                   0              0   \n",
+       "...                                        ...            ...   \n",
+       "199976 2182-02-14 11:15:00                   0              0   \n",
+       "       2182-02-16 03:57:00                   0              0   \n",
+       "       2182-02-19 03:59:00                   0              0   \n",
+       "       2182-02-20 03:31:00                   0              0   \n",
+       "       2182-02-21 04:55:00                   0              0   \n",
+       "199979 2182-02-06 09:17:00                   0              0   \n",
+       "       2182-02-06 14:16:00                   0              0   \n",
+       "199981 2110-09-24 16:34:00                   0              0   \n",
+       "       2110-09-24 20:09:00                   0              0   \n",
+       "       2110-09-25 06:10:00                   0              0   \n",
+       "199987 2175-05-19 16:30:00                   0              0   \n",
+       "199988 2169-01-24 12:48:00                   0              0   \n",
+       "       2169-02-07 01:35:00                   0              0   \n",
+       "       2169-02-07 11:18:00                   0              0   \n",
+       "       2169-02-07 16:43:00                   0              0   \n",
+       "       2169-02-07 22:35:00                   0              0   \n",
+       "       2169-02-10 05:33:00                   0              0   \n",
+       "199993 2161-11-12 23:14:00                   0              0   \n",
+       "       2161-11-13 03:46:00                   0              0   \n",
+       "199994 2188-07-07 21:23:00                   0              0   \n",
+       "       2188-07-08 03:09:00                   0              0   \n",
+       "       2188-07-08 04:13:00                   0              0   \n",
+       "       2188-07-08 06:20:00                   0              0   \n",
+       "199998 2119-02-20 10:52:00                   0              0   \n",
+       "       2119-02-20 12:36:00                   0              0   \n",
+       "       2119-02-20 13:33:00                   0              0   \n",
+       "       2119-02-20 13:59:00                   0              0   \n",
+       "       2119-02-20 20:43:00                   0              0   \n",
+       "199999 2136-04-04 20:55:00                   0              0   \n",
+       "       2136-04-06 15:29:00                   0              0   \n",
+       "\n",
+       "label                                                         \\\n",
+       "status                                                         \n",
+       "variable_type                                                  \n",
+       "units                                                          \n",
+       "description                1531(mmol/L)_5,0 1531(mmol/L)_>30   \n",
+       "id     datetime                                                \n",
+       "100001 2117-09-11 09:32:00                0                0   \n",
+       "100003 2150-04-17 19:12:00                0                0   \n",
+       "100006 2108-04-08 10:58:00                0                0   \n",
+       "100007 2145-03-31 00:44:00                0                0   \n",
+       "       2145-04-02 14:10:00                0                0   \n",
+       "100009 2162-05-17 13:19:00                0                0   \n",
+       "       2162-05-17 17:14:00                0                0   \n",
+       "100010 2109-12-10 10:25:00                0                0   \n",
+       "       2109-12-10 12:11:00                0                0   \n",
+       "       2109-12-10 13:05:00                0                0   \n",
+       "       2109-12-10 13:58:00                0                0   \n",
+       "100011 2177-08-29 04:44:00                0                0   \n",
+       "       2177-08-29 06:55:00                0                0   \n",
+       "100012 2177-03-14 07:38:00                0                0   \n",
+       "       2177-03-14 11:42:00                0                0   \n",
+       "       2177-03-15 08:05:00                0                0   \n",
+       "       2177-03-15 14:01:00                0                0   \n",
+       "       2177-03-15 21:42:00                0                0   \n",
+       "100016 2188-05-24 12:00:00                0                0   \n",
+       "100017 2103-03-11 05:10:00                0                0   \n",
+       "100018 2176-08-29 15:29:00                0                0   \n",
+       "       2176-08-30 09:23:00                0                0   \n",
+       "       2176-08-30 10:19:00                0                0   \n",
+       "       2176-08-30 11:29:00                0                0   \n",
+       "       2176-08-30 12:40:00                0                0   \n",
+       "100020 2142-11-30 21:54:00                0                0   \n",
+       "       2142-12-03 00:17:00                0                0   \n",
+       "100024 2170-09-19 10:25:00                0                0   \n",
+       "       2170-09-19 16:33:00                0                0   \n",
+       "       2170-09-20 02:04:00                0                0   \n",
+       "...                                     ...              ...   \n",
+       "199976 2182-02-14 11:15:00                0                0   \n",
+       "       2182-02-16 03:57:00                0                0   \n",
+       "       2182-02-19 03:59:00                0                0   \n",
+       "       2182-02-20 03:31:00                0                0   \n",
+       "       2182-02-21 04:55:00                0                0   \n",
+       "199979 2182-02-06 09:17:00                0                0   \n",
+       "       2182-02-06 14:16:00                0                0   \n",
+       "199981 2110-09-24 16:34:00                0                0   \n",
+       "       2110-09-24 20:09:00                0                0   \n",
+       "       2110-09-25 06:10:00                0                0   \n",
+       "199987 2175-05-19 16:30:00                0                0   \n",
+       "199988 2169-01-24 12:48:00                0                0   \n",
+       "       2169-02-07 01:35:00                0                0   \n",
+       "       2169-02-07 11:18:00                0                0   \n",
+       "       2169-02-07 16:43:00                0                0   \n",
+       "       2169-02-07 22:35:00                0                0   \n",
+       "       2169-02-10 05:33:00                0                0   \n",
+       "199993 2161-11-12 23:14:00                0                0   \n",
+       "       2161-11-13 03:46:00                0                0   \n",
+       "199994 2188-07-07 21:23:00                0                0   \n",
+       "       2188-07-08 03:09:00                0                0   \n",
+       "       2188-07-08 04:13:00                0                0   \n",
+       "       2188-07-08 06:20:00                0                0   \n",
+       "199998 2119-02-20 10:52:00                0                0   \n",
+       "       2119-02-20 12:36:00                0                0   \n",
+       "       2119-02-20 13:33:00                0                0   \n",
+       "       2119-02-20 13:59:00                0                0   \n",
+       "       2119-02-20 20:43:00                0                0   \n",
+       "199999 2136-04-04 20:55:00                0                0   \n",
+       "       2136-04-06 15:29:00                0                0   \n",
+       "\n",
+       "label                                                               \\\n",
+       "status                                                               \n",
+       "variable_type                                                        \n",
+       "units                                                                \n",
+       "description                1531(mmol/L)_>30.0 1531(mmol/L)_CLOTTED   \n",
+       "id     datetime                                                      \n",
+       "100001 2117-09-11 09:32:00                  0                    0   \n",
+       "100003 2150-04-17 19:12:00                  0                    0   \n",
+       "100006 2108-04-08 10:58:00                  0                    0   \n",
+       "100007 2145-03-31 00:44:00                  0                    0   \n",
+       "       2145-04-02 14:10:00                  0                    0   \n",
+       "100009 2162-05-17 13:19:00                  0                    0   \n",
+       "       2162-05-17 17:14:00                  0                    0   \n",
+       "100010 2109-12-10 10:25:00                  0                    0   \n",
+       "       2109-12-10 12:11:00                  0                    0   \n",
+       "       2109-12-10 13:05:00                  0                    0   \n",
+       "       2109-12-10 13:58:00                  0                    0   \n",
+       "100011 2177-08-29 04:44:00                  0                    0   \n",
+       "       2177-08-29 06:55:00                  0                    0   \n",
+       "100012 2177-03-14 07:38:00                  0                    0   \n",
+       "       2177-03-14 11:42:00                  0                    0   \n",
+       "       2177-03-15 08:05:00                  0                    0   \n",
+       "       2177-03-15 14:01:00                  0                    0   \n",
+       "       2177-03-15 21:42:00                  0                    0   \n",
+       "100016 2188-05-24 12:00:00                  0                    0   \n",
+       "100017 2103-03-11 05:10:00                  0                    0   \n",
+       "100018 2176-08-29 15:29:00                  0                    0   \n",
+       "       2176-08-30 09:23:00                  0                    0   \n",
+       "       2176-08-30 10:19:00                  0                    0   \n",
+       "       2176-08-30 11:29:00                  0                    0   \n",
+       "       2176-08-30 12:40:00                  0                    0   \n",
+       "100020 2142-11-30 21:54:00                  0                    0   \n",
+       "       2142-12-03 00:17:00                  0                    0   \n",
+       "100024 2170-09-19 10:25:00                  0                    0   \n",
+       "       2170-09-19 16:33:00                  0                    0   \n",
+       "       2170-09-20 02:04:00                  0                    0   \n",
+       "...                                       ...                  ...   \n",
+       "199976 2182-02-14 11:15:00                  0                    0   \n",
+       "       2182-02-16 03:57:00                  0                    0   \n",
+       "       2182-02-19 03:59:00                  0                    0   \n",
+       "       2182-02-20 03:31:00                  0                    0   \n",
+       "       2182-02-21 04:55:00                  0                    0   \n",
+       "199979 2182-02-06 09:17:00                  0                    0   \n",
+       "       2182-02-06 14:16:00                  0                    0   \n",
+       "199981 2110-09-24 16:34:00                  0                    0   \n",
+       "       2110-09-24 20:09:00                  0                    0   \n",
+       "       2110-09-25 06:10:00                  0                    0   \n",
+       "199987 2175-05-19 16:30:00                  0                    0   \n",
+       "199988 2169-01-24 12:48:00                  0                    0   \n",
+       "       2169-02-07 01:35:00                  0                    0   \n",
+       "       2169-02-07 11:18:00                  0                    0   \n",
+       "       2169-02-07 16:43:00                  0                    0   \n",
+       "       2169-02-07 22:35:00                  0                    0   \n",
+       "       2169-02-10 05:33:00                  0                    0   \n",
+       "199993 2161-11-12 23:14:00                  0                    0   \n",
+       "       2161-11-13 03:46:00                  0                    0   \n",
+       "199994 2188-07-07 21:23:00                  0                    0   \n",
+       "       2188-07-08 03:09:00                  0                    0   \n",
+       "       2188-07-08 04:13:00                  0                    0   \n",
+       "       2188-07-08 06:20:00                  0                    0   \n",
+       "199998 2119-02-20 10:52:00                  0                    0   \n",
+       "       2119-02-20 12:36:00                  0                    0   \n",
+       "       2119-02-20 13:33:00                  0                    0   \n",
+       "       2119-02-20 13:59:00                  0                    0   \n",
+       "       2119-02-20 20:43:00                  0                    0   \n",
+       "199999 2136-04-04 20:55:00                  0                    0   \n",
+       "       2136-04-06 15:29:00                  0                    0   \n",
+       "\n",
+       "label                                                              \\\n",
+       "status                                                              \n",
+       "variable_type                                                       \n",
+       "units                                                               \n",
+       "description                1531(mmol/L)_ERROR 1531(mmol/L)_VOIDED   \n",
+       "id     datetime                                                     \n",
+       "100001 2117-09-11 09:32:00                  0                   0   \n",
+       "100003 2150-04-17 19:12:00                  0                   0   \n",
+       "100006 2108-04-08 10:58:00                  0                   0   \n",
+       "100007 2145-03-31 00:44:00                  0                   0   \n",
+       "       2145-04-02 14:10:00                  0                   0   \n",
+       "100009 2162-05-17 13:19:00                  0                   0   \n",
+       "       2162-05-17 17:14:00                  0                   0   \n",
+       "100010 2109-12-10 10:25:00                  0                   0   \n",
+       "       2109-12-10 12:11:00                  0                   0   \n",
+       "       2109-12-10 13:05:00                  0                   0   \n",
+       "       2109-12-10 13:58:00                  0                   0   \n",
+       "100011 2177-08-29 04:44:00                  0                   0   \n",
+       "       2177-08-29 06:55:00                  0                   0   \n",
+       "100012 2177-03-14 07:38:00                  0                   0   \n",
+       "       2177-03-14 11:42:00                  0                   0   \n",
+       "       2177-03-15 08:05:00                  0                   0   \n",
+       "       2177-03-15 14:01:00                  0                   0   \n",
+       "       2177-03-15 21:42:00                  0                   0   \n",
+       "100016 2188-05-24 12:00:00                  0                   0   \n",
+       "100017 2103-03-11 05:10:00                  0                   0   \n",
+       "100018 2176-08-29 15:29:00                  0                   0   \n",
+       "       2176-08-30 09:23:00                  0                   0   \n",
+       "       2176-08-30 10:19:00                  0                   0   \n",
+       "       2176-08-30 11:29:00                  0                   0   \n",
+       "       2176-08-30 12:40:00                  0                   0   \n",
+       "100020 2142-11-30 21:54:00                  0                   0   \n",
+       "       2142-12-03 00:17:00                  0                   0   \n",
+       "100024 2170-09-19 10:25:00                  0                   0   \n",
+       "       2170-09-19 16:33:00                  0                   0   \n",
+       "       2170-09-20 02:04:00                  0                   0   \n",
+       "...                                       ...                 ...   \n",
+       "199976 2182-02-14 11:15:00                  0                   0   \n",
+       "       2182-02-16 03:57:00                  0                   0   \n",
+       "       2182-02-19 03:59:00                  0                   0   \n",
+       "       2182-02-20 03:31:00                  0                   0   \n",
+       "       2182-02-21 04:55:00                  0                   0   \n",
+       "199979 2182-02-06 09:17:00                  0                   0   \n",
+       "       2182-02-06 14:16:00                  0                   0   \n",
+       "199981 2110-09-24 16:34:00                  0                   0   \n",
+       "       2110-09-24 20:09:00                  0                   0   \n",
+       "       2110-09-25 06:10:00                  0                   0   \n",
+       "199987 2175-05-19 16:30:00                  0                   0   \n",
+       "199988 2169-01-24 12:48:00                  0                   0   \n",
+       "       2169-02-07 01:35:00                  0                   0   \n",
+       "       2169-02-07 11:18:00                  0                   0   \n",
+       "       2169-02-07 16:43:00                  0                   0   \n",
+       "       2169-02-07 22:35:00                  0                   0   \n",
+       "       2169-02-10 05:33:00                  0                   0   \n",
+       "199993 2161-11-12 23:14:00                  0                   0   \n",
+       "       2161-11-13 03:46:00                  0                   0   \n",
+       "199994 2188-07-07 21:23:00                  0                   0   \n",
+       "       2188-07-08 03:09:00                  0                   0   \n",
+       "       2188-07-08 04:13:00                  0                   0   \n",
+       "       2188-07-08 06:20:00                  0                   0   \n",
+       "199998 2119-02-20 10:52:00                  0                   0   \n",
+       "       2119-02-20 12:36:00                  0                   0   \n",
+       "       2119-02-20 13:33:00                  0                   0   \n",
+       "       2119-02-20 13:59:00                  0                   0   \n",
+       "       2119-02-20 20:43:00                  0                   0   \n",
+       "199999 2136-04-04 20:55:00                  0                   0   \n",
+       "       2136-04-06 15:29:00                  0                   0   \n",
+       "\n",
+       "label                                            \n",
+       "status                                           \n",
+       "variable_type                                    \n",
+       "units                                            \n",
+       "description                1531(mmol/L)_no data  \n",
+       "id     datetime                                  \n",
+       "100001 2117-09-11 09:32:00                    0  \n",
+       "100003 2150-04-17 19:12:00                    0  \n",
+       "100006 2108-04-08 10:58:00                    0  \n",
+       "100007 2145-03-31 00:44:00                    0  \n",
+       "       2145-04-02 14:10:00                    0  \n",
+       "100009 2162-05-17 13:19:00                    0  \n",
+       "       2162-05-17 17:14:00                    0  \n",
+       "100010 2109-12-10 10:25:00                    0  \n",
+       "       2109-12-10 12:11:00                    0  \n",
+       "       2109-12-10 13:05:00                    0  \n",
+       "       2109-12-10 13:58:00                    0  \n",
+       "100011 2177-08-29 04:44:00                    0  \n",
+       "       2177-08-29 06:55:00                    0  \n",
+       "100012 2177-03-14 07:38:00                    0  \n",
+       "       2177-03-14 11:42:00                    0  \n",
+       "       2177-03-15 08:05:00                    0  \n",
+       "       2177-03-15 14:01:00                    0  \n",
+       "       2177-03-15 21:42:00                    0  \n",
+       "100016 2188-05-24 12:00:00                    0  \n",
+       "100017 2103-03-11 05:10:00                    0  \n",
+       "100018 2176-08-29 15:29:00                    0  \n",
+       "       2176-08-30 09:23:00                    0  \n",
+       "       2176-08-30 10:19:00                    0  \n",
+       "       2176-08-30 11:29:00                    0  \n",
+       "       2176-08-30 12:40:00                    0  \n",
+       "100020 2142-11-30 21:54:00                    0  \n",
+       "       2142-12-03 00:17:00                    0  \n",
+       "100024 2170-09-19 10:25:00                    0  \n",
+       "       2170-09-19 16:33:00                    0  \n",
+       "       2170-09-20 02:04:00                    0  \n",
+       "...                                         ...  \n",
+       "199976 2182-02-14 11:15:00                    0  \n",
+       "       2182-02-16 03:57:00                    0  \n",
+       "       2182-02-19 03:59:00                    0  \n",
+       "       2182-02-20 03:31:00                    0  \n",
+       "       2182-02-21 04:55:00                    0  \n",
+       "199979 2182-02-06 09:17:00                    0  \n",
+       "       2182-02-06 14:16:00                    0  \n",
+       "199981 2110-09-24 16:34:00                    0  \n",
+       "       2110-09-24 20:09:00                    0  \n",
+       "       2110-09-25 06:10:00                    0  \n",
+       "199987 2175-05-19 16:30:00                    0  \n",
+       "199988 2169-01-24 12:48:00                    0  \n",
+       "       2169-02-07 01:35:00                    0  \n",
+       "       2169-02-07 11:18:00                    0  \n",
+       "       2169-02-07 16:43:00                    0  \n",
+       "       2169-02-07 22:35:00                    0  \n",
+       "       2169-02-10 05:33:00                    0  \n",
+       "199993 2161-11-12 23:14:00                    0  \n",
+       "       2161-11-13 03:46:00                    0  \n",
+       "199994 2188-07-07 21:23:00                    0  \n",
+       "       2188-07-08 03:09:00                    0  \n",
+       "       2188-07-08 04:13:00                    0  \n",
+       "       2188-07-08 06:20:00                    0  \n",
+       "199998 2119-02-20 10:52:00                    0  \n",
+       "       2119-02-20 12:36:00                    0  \n",
+       "       2119-02-20 13:33:00                    0  \n",
+       "       2119-02-20 13:59:00                    0  \n",
+       "       2119-02-20 20:43:00                    0  \n",
+       "199999 2136-04-04 20:55:00                    0  \n",
+       "       2136-04-06 15:29:00                    0  \n",
+       "\n",
+       "[177450 rows x 29 columns]"
+      ]
+     },
+     "execution_count": 28,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Boolean mask over the column MultiIndex: True where the 'variable_type' level equals NOMINAL.\n",
+    "nominal_cols = df_cleaned.columns.get_level_values('variable_type') == variable_type.NOMINAL\n",
+    "\n",
+    "# Replace every nominal column with one indicator (dummy) column per distinct value.\n",
+    "# The loop walks the column labels of a selection made before the loop starts,\n",
+    "# while df_cleaned itself is rebound on each pass.\n",
+    "for col_name in df_cleaned.loc[:,nominal_cols]:\n",
+    "    # Must be the loop variable: the previous 'col_nam' was an undefined name (NameError on a fresh kernel).\n",
+    "    column = df_cleaned[col_name]\n",
+    "    df_dummies = pd.get_dummies(column)\n",
+    "    # Keep all column levels except the last, which becomes '<last level>_<value>'.\n",
+    "    dummy_col_names = [col_name[:-1] + ('{}_{}'.format(col_name[-1],text),) for text in df_dummies.columns]\n",
+    "    df_dummies.columns = pd.MultiIndex.from_tuples(dummy_col_names,names=df_cleaned.columns.names)\n",
+    "    \n",
+    "    # Swap the original nominal column for its dummy columns.\n",
+    "    df_cleaned.drop(col_name,axis=1,inplace=True)\n",
+    "    df_cleaned = df_cleaned.join(df_dummies,how='outer')\n",
+    "\n",
+    "df_cleaned"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Possible additional cleaning:\n",
+    "\n",
+    "1. Infer units of measure (UOM)\n",
+    "2. Remove extreme values [DONE]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import utils\n",
+    "import mimic\n",
+    "import transformers\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import icu_data_defs\n",
+    "import units"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Open the stored 'temperature body' extract through utils.open_df.\n",
+    "# NOTE(review): the two arguments are presumably the store location and the key within it -- confirm.\n",
+    "df_temp = utils.open_df(\n",
+    "    'data/mimic_data',\n",
+    "    'extract/temperature body'\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# Re-import mimic before use, then build its transform pipeline for 'temperature body'.\n",
+    "# NOTE(review): bare reload() is a builtin only on Python 2 -- confirm the kernel version.\n",
+    "reload(mimic)\n",
+    "pipeline = mimic.transform_pipeline('temperature body')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-25 00:00:00</td>\n",
+       "      <td>98.400001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>188670.0</td>\n",
+       "      <td>2183-08-23 20:00:00</td>\n",
+       "      <td>99.300003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-12 08:00:00</td>\n",
+       "      <td>98.699996948242188</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-13 17:00:00</td>\n",
+       "      <td>99.900001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-11 20:00:00</td>\n",
+       "      <td>37.900001525878906</td>\n",
+       "      <td>degC</td>\n",
+       "      <td>676</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>166707.0</td>\n",
+       "      <td>2122-02-13 00:00:00</td>\n",
+       "      <td>97.800003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-11 21:00:00</td>\n",
+       "      <td>99.099998474121094</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-24 04:00:00</td>\n",
+       "      <td>98.900001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>176176.0</td>\n",
+       "      <td>2116-12-24 16:00:00</td>\n",
+       "      <td>99.099998474121094</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-13 03:00:00</td>\n",
+       "      <td>99.199996948242188</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-30 18:00:00</td>\n",
+       "      <td>98.800003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>181750.0</td>\n",
+       "      <td>2192-11-24 08:00:00</td>\n",
+       "      <td>98.5</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-14 12:00:00</td>\n",
+       "      <td>100.40000152587891</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-14 13:00:00</td>\n",
+       "      <td>100.69999694824219</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-15 22:00:00</td>\n",
+       "      <td>99.800003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>15</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-16 21:00:00</td>\n",
+       "      <td>100.59999847412109</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>16</th>\n",
+       "      <td>185910.0</td>\n",
+       "      <td>2166-08-23 08:00:00</td>\n",
+       "      <td>98</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>17</th>\n",
+       "      <td>190797.0</td>\n",
+       "      <td>2191-01-10 08:00:00</td>\n",
+       "      <td>97.900001525878906</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>18</th>\n",
+       "      <td>157907.0</td>\n",
+       "      <td>2129-06-10 23:00:00</td>\n",
+       "      <td>100.09999847412109</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>19</th>\n",
+       "      <td>157907.0</td>\n",
+       "      <td>2129-06-11 04:30:00</td>\n",
+       "      <td>98.800003051757812</td>\n",
+       "      <td>degF</td>\n",
+       "      <td>678</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "          id            datetime               value units  itemid\n",
+       "0   185910.0 2166-08-25 00:00:00  98.400001525878906  degF     678\n",
+       "1   188670.0 2183-08-23 20:00:00  99.300003051757812  degF     678\n",
+       "2   185910.0 2166-08-12 08:00:00  98.699996948242188  degF     678\n",
+       "3   185910.0 2166-08-13 17:00:00  99.900001525878906  degF     678\n",
+       "4   166707.0 2122-02-11 20:00:00  37.900001525878906  degC     676\n",
+       "5   166707.0 2122-02-13 00:00:00  97.800003051757812  degF     678\n",
+       "6   185910.0 2166-08-11 21:00:00  99.099998474121094  degF     678\n",
+       "7   185910.0 2166-08-24 04:00:00  98.900001525878906  degF     678\n",
+       "8   176176.0 2116-12-24 16:00:00  99.099998474121094  degF     678\n",
+       "9   185910.0 2166-08-13 03:00:00  99.199996948242188  degF     678\n",
+       "10  185910.0 2166-08-30 18:00:00  98.800003051757812  degF     678\n",
+       "11  181750.0 2192-11-24 08:00:00                98.5  degF     678\n",
+       "12  185910.0 2166-08-14 12:00:00  100.40000152587891  degF     678\n",
+       "13  185910.0 2166-08-14 13:00:00  100.69999694824219  degF     678\n",
+       "14  185910.0 2166-08-15 22:00:00  99.800003051757812  degF     678\n",
+       "15  185910.0 2166-08-16 21:00:00  100.59999847412109  degF     678\n",
+       "16  185910.0 2166-08-23 08:00:00                  98  degF     678\n",
+       "17  190797.0 2191-01-10 08:00:00  97.900001525878906  degF     678\n",
+       "18  157907.0 2129-06-10 23:00:00  100.09999847412109  degF     678\n",
+       "19  157907.0 2129-06-11 04:30:00  98.800003051757812  degF     678"
+      ]
+     },
+     "execution_count": 5,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "df_temp_tr = pipeline.transform(df_temp)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degF</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degC</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762</th>\n",
+       "      <th>676</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"20\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <td>98</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <td>97.9</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <td>100</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 08:00:00</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 12:00:00</th>\n",
+       "      <td>97.5</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 19:00:00</th>\n",
+       "      <td>99.8</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 00:00:00</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 04:00:00</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 08:00:00</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 12:00:00</th>\n",
+       "      <td>98.8</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 16:00:00</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 22:00:00</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 00:00:00</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 04:00:00</th>\n",
+       "      <td>99.6</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 08:00:00</th>\n",
+       "      <td>99</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 13:00:00</th>\n",
+       "      <td>98</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 19:00:00</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      temperature body                     \n",
+       "units                                  degF          degC       \n",
+       "description                          223761 678    223762 676   \n",
+       "id     datetime                                                 \n",
+       "100001 2117-09-11 13:48:00               98   None   None   None\n",
+       "       2117-09-11 16:00:00             97.9   None   None   None\n",
+       "       2117-09-11 19:00:00             99.5   None   None   None\n",
+       "       2117-09-11 22:00:00              100   None   None   None\n",
+       "       2117-09-12 01:00:00             99.9   None   None   None\n",
+       "       2117-09-12 04:00:00             97.7   None   None   None\n",
+       "       2117-09-12 08:00:00             97.8   None   None   None\n",
+       "       2117-09-12 12:00:00             97.5   None   None   None\n",
+       "       2117-09-12 19:00:00             99.8   None   None   None\n",
+       "       2117-09-13 00:00:00             99.7   None   None   None\n",
+       "       2117-09-13 04:00:00             99.3   None   None   None\n",
+       "       2117-09-13 08:00:00             99.4   None   None   None\n",
+       "       2117-09-13 12:00:00             98.8   None   None   None\n",
+       "       2117-09-13 16:00:00             99.3   None   None   None\n",
+       "       2117-09-13 22:00:00             99.9   None   None   None\n",
+       "       2117-09-14 00:00:00             99.4   None   None   None\n",
+       "       2117-09-14 04:00:00             99.6   None   None   None\n",
+       "       2117-09-14 08:00:00               99   None   None   None\n",
+       "       2117-09-14 13:00:00               98   None   None   None\n",
+       "       2117-09-14 19:00:00             99.5   None   None   None"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_tr.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 26,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload(transformers)  # re-import the local modules so edits made since import take effect\n",
+    "reload(units)\n",
+    "reload(icu_data_defs)\n",
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n",
+    "ureg = units.MedicalUreg()\n",
+    "agg_func = lambda x:x.iloc[0]  # aggregation callback: first element of whatever it is given\n",
+    "standard_pipeline = Pipeline(steps=[\n",
+    "    ('drop_small_columns', transformers.remove_small_columns(threshold=5)),\n",
+    "    ('aggregate_same_datetime', transformers.same_index_aggregator(agg_func)),\n",
+    "    ('split_dtype', transformers.split_dtype()),\n",
+    "])\n",
+    "# stand-alone transformers, kept outside the pipeline so each can be applied separately\n",
+    "stnd_cols = transformers.column_standardizer(data_dict, ureg)\n",
+    "drop_oob = transformers.oob_value_remover(data_dict)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "df_temp_cl = standard_pipeline.transform(df_temp_tr)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degF</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degC</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762</th>\n",
+       "      <th>676</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"20\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <td>97.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 08:00:00</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 12:00:00</th>\n",
+       "      <td>97.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 19:00:00</th>\n",
+       "      <td>99.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 00:00:00</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 04:00:00</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 08:00:00</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 12:00:00</th>\n",
+       "      <td>98.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 16:00:00</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 22:00:00</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 00:00:00</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 04:00:00</th>\n",
+       "      <td>99.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 08:00:00</th>\n",
+       "      <td>99.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 13:00:00</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 19:00:00</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      temperature body                     \n",
+       "units                                  degF          degC       \n",
+       "description                          223761 678    223762 676   \n",
+       "id     datetime                                                 \n",
+       "100001 2117-09-11 13:48:00             98.0    NaN    NaN    NaN\n",
+       "       2117-09-11 16:00:00             97.9    NaN    NaN    NaN\n",
+       "       2117-09-11 19:00:00             99.5    NaN    NaN    NaN\n",
+       "       2117-09-11 22:00:00            100.0    NaN    NaN    NaN\n",
+       "       2117-09-12 01:00:00             99.9    NaN    NaN    NaN\n",
+       "       2117-09-12 04:00:00             97.7    NaN    NaN    NaN\n",
+       "       2117-09-12 08:00:00             97.8    NaN    NaN    NaN\n",
+       "       2117-09-12 12:00:00             97.5    NaN    NaN    NaN\n",
+       "       2117-09-12 19:00:00             99.8    NaN    NaN    NaN\n",
+       "       2117-09-13 00:00:00             99.7    NaN    NaN    NaN\n",
+       "       2117-09-13 04:00:00             99.3    NaN    NaN    NaN\n",
+       "       2117-09-13 08:00:00             99.4    NaN    NaN    NaN\n",
+       "       2117-09-13 12:00:00             98.8    NaN    NaN    NaN\n",
+       "       2117-09-13 16:00:00             99.3    NaN    NaN    NaN\n",
+       "       2117-09-13 22:00:00             99.9    NaN    NaN    NaN\n",
+       "       2117-09-14 00:00:00             99.4    NaN    NaN    NaN\n",
+       "       2117-09-14 04:00:00             99.6    NaN    NaN    NaN\n",
+       "       2117-09-14 08:00:00             99.0    NaN    NaN    NaN\n",
+       "       2117-09-14 13:00:00             98.0    NaN    NaN    NaN\n",
+       "       2117-09-14 19:00:00             99.5    NaN    NaN    NaN"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_cl.head(20)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "df_temp_conv = stnd_cols.transform(df_temp_cl)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">degF</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762(degC)</th>\n",
+       "      <th>676(degC)</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>522143.000000</td>\n",
+       "      <td>768158.000000</td>\n",
+       "      <td>74144.000000</td>\n",
+       "      <td>370309.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>98.407970</td>\n",
+       "      <td>98.570606</td>\n",
+       "      <td>99.193821</td>\n",
+       "      <td>98.765740</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>14.681127</td>\n",
+       "      <td>2.666614</td>\n",
+       "      <td>9.735224</td>\n",
+       "      <td>2.608901</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>-99.900000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>26.600000</td>\n",
+       "      <td>32.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>97.500000</td>\n",
+       "      <td>97.599998</td>\n",
+       "      <td>97.520000</td>\n",
+       "      <td>97.879998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>98.300000</td>\n",
+       "      <td>98.599998</td>\n",
+       "      <td>98.600000</td>\n",
+       "      <td>98.960002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>99.300000</td>\n",
+       "      <td>99.599998</td>\n",
+       "      <td>99.680000</td>\n",
+       "      <td>99.860002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>9637.000000</td>\n",
+       "      <td>109.000000</td>\n",
+       "      <td>709.700000</td>\n",
+       "      <td>115.700000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         temperature body                                            \n",
+       "status                   known                                            \n",
+       "variable_type               qn                                            \n",
+       "units                     degF                                            \n",
+       "description             223761            678  223762(degC)      676(degC)\n",
+       "count            522143.000000  768158.000000  74144.000000  370309.000000\n",
+       "mean                 98.407970      98.570606     99.193821      98.765740\n",
+       "std                  14.681127       2.666614      9.735224       2.608901\n",
+       "min                 -99.900000       0.000000     26.600000      32.000000\n",
+       "25%                  97.500000      97.599998     97.520000      97.879998\n",
+       "50%                  98.300000      98.599998     98.600000      98.960002\n",
+       "75%                  99.300000      99.599998     99.680000      99.860002\n",
+       "max                9637.000000     109.000000    709.700000     115.700000"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_conv.describe()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "df_temp_no_oob = drop_oob.transform(df_temp_conv)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">degF</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762(degC)</th>\n",
+       "      <th>676(degC)</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>522116.000000</td>\n",
+       "      <td>768158.000000</td>\n",
+       "      <td>73638.000000</td>\n",
+       "      <td>370309.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>98.352642</td>\n",
+       "      <td>98.570606</td>\n",
+       "      <td>98.430646</td>\n",
+       "      <td>98.765740</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>2.825922</td>\n",
+       "      <td>2.666614</td>\n",
+       "      <td>2.467125</td>\n",
+       "      <td>2.608901</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>26.600000</td>\n",
+       "      <td>32.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>97.500000</td>\n",
+       "      <td>97.599998</td>\n",
+       "      <td>97.340000</td>\n",
+       "      <td>97.879998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>98.300000</td>\n",
+       "      <td>98.599998</td>\n",
+       "      <td>98.600000</td>\n",
+       "      <td>98.960002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>99.300000</td>\n",
+       "      <td>99.599998</td>\n",
+       "      <td>99.680000</td>\n",
+       "      <td>99.860002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>129.000000</td>\n",
+       "      <td>109.000000</td>\n",
+       "      <td>113.000000</td>\n",
+       "      <td>115.700000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label         temperature body                                            \n",
+       "status                   known                                            \n",
+       "variable_type               qn                                            \n",
+       "units                     degF                                            \n",
+       "description             223761            678  223762(degC)      676(degC)\n",
+       "count            522116.000000  768158.000000  73638.000000  370309.000000\n",
+       "mean                 98.352642      98.570606     98.430646      98.765740\n",
+       "std                   2.825922       2.666614      2.467125       2.608901\n",
+       "min                   0.000000       0.000000     26.600000      32.000000\n",
+       "25%                  97.500000      97.599998     97.340000      97.879998\n",
+       "50%                  98.300000      98.599998     98.600000      98.960002\n",
+       "75%                  99.300000      99.599998     99.680000      99.860002\n",
+       "max                 129.000000     109.000000    113.000000     115.700000"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_no_oob.describe()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 27,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "combine_like = transformers.combine_like_cols()\n",
+    "df_temp_combined = combine_like.transform(df_temp_no_oob)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 28,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th>temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th>known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th>qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th>degF</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>all</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"24\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <td>97.900000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <td>99.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <td>100.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <td>99.900000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <td>97.700000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 08:00:00</th>\n",
+       "      <td>97.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 12:00:00</th>\n",
+       "      <td>97.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 19:00:00</th>\n",
+       "      <td>99.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 00:00:00</th>\n",
+       "      <td>99.700000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 04:00:00</th>\n",
+       "      <td>99.300000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 08:00:00</th>\n",
+       "      <td>99.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 12:00:00</th>\n",
+       "      <td>98.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 16:00:00</th>\n",
+       "      <td>99.300000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 22:00:00</th>\n",
+       "      <td>99.900000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 00:00:00</th>\n",
+       "      <td>99.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 04:00:00</th>\n",
+       "      <td>99.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 08:00:00</th>\n",
+       "      <td>99.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 13:00:00</th>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 19:00:00</th>\n",
+       "      <td>99.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 00:00:00</th>\n",
+       "      <td>99.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 08:00:00</th>\n",
+       "      <td>98.300000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 12:00:00</th>\n",
+       "      <td>97.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 16:00:00</th>\n",
+       "      <td>98.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">100003</th>\n",
+       "      <th>2150-04-17 20:31:00</th>\n",
+       "      <td>95.900000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-17 22:00:00</th>\n",
+       "      <td>98.200000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 00:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 04:00:00</th>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 08:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 11:18:00</th>\n",
+       "      <td>96.300000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"7\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-21 02:00:00</th>\n",
+       "      <td>100.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 03:00:00</th>\n",
+       "      <td>100.220003</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 04:00:00</th>\n",
+       "      <td>99.860002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 05:00:00</th>\n",
+       "      <td>100.220003</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 06:00:00</th>\n",
+       "      <td>100.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 07:00:00</th>\n",
+       "      <td>100.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-21 08:00:00</th>\n",
+       "      <td>100.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"23\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-06 16:07:00</th>\n",
+       "      <td>97.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 20:00:00</th>\n",
+       "      <td>97.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 00:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 02:00:00</th>\n",
+       "      <td>101.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 05:00:00</th>\n",
+       "      <td>100.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 08:00:00</th>\n",
+       "      <td>99.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 12:00:00</th>\n",
+       "      <td>99.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 15:00:00</th>\n",
+       "      <td>100.700000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 18:00:00</th>\n",
+       "      <td>97.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 22:00:00</th>\n",
+       "      <td>98.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 04:00:00</th>\n",
+       "      <td>98.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 09:00:00</th>\n",
+       "      <td>97.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 16:00:00</th>\n",
+       "      <td>97.700000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 20:00:00</th>\n",
+       "      <td>99.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 00:00:00</th>\n",
+       "      <td>99.600000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 05:00:00</th>\n",
+       "      <td>99.100000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 08:00:00</th>\n",
+       "      <td>97.800000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 12:00:00</th>\n",
+       "      <td>98.300000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 16:00:00</th>\n",
+       "      <td>98.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 20:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 00:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 03:00:00</th>\n",
+       "      <td>97.400000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-10 08:00:00</th>\n",
+       "      <td>98.100000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>1731503 rows × 1 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                      temperature body\n",
+       "status                                known\n",
+       "variable_type                            qn\n",
+       "units                                  degF\n",
+       "description                             all\n",
+       "id     datetime                            \n",
+       "100001 2117-09-11 13:48:00        98.000000\n",
+       "       2117-09-11 16:00:00        97.900000\n",
+       "       2117-09-11 19:00:00        99.500000\n",
+       "       2117-09-11 22:00:00       100.000000\n",
+       "       2117-09-12 01:00:00        99.900000\n",
+       "       2117-09-12 04:00:00        97.700000\n",
+       "       2117-09-12 08:00:00        97.800000\n",
+       "       2117-09-12 12:00:00        97.500000\n",
+       "       2117-09-12 19:00:00        99.800000\n",
+       "       2117-09-13 00:00:00        99.700000\n",
+       "       2117-09-13 04:00:00        99.300000\n",
+       "       2117-09-13 08:00:00        99.400000\n",
+       "       2117-09-13 12:00:00        98.800000\n",
+       "       2117-09-13 16:00:00        99.300000\n",
+       "       2117-09-13 22:00:00        99.900000\n",
+       "       2117-09-14 00:00:00        99.400000\n",
+       "       2117-09-14 04:00:00        99.600000\n",
+       "       2117-09-14 08:00:00        99.000000\n",
+       "       2117-09-14 13:00:00        98.000000\n",
+       "       2117-09-14 19:00:00        99.500000\n",
+       "       2117-09-15 00:00:00        99.600000\n",
+       "       2117-09-15 08:00:00        98.300000\n",
+       "       2117-09-15 12:00:00        97.800000\n",
+       "       2117-09-15 16:00:00        98.600000\n",
+       "100003 2150-04-17 20:31:00        95.900000\n",
+       "       2150-04-17 22:00:00        98.200000\n",
+       "       2150-04-18 00:00:00        97.400000\n",
+       "       2150-04-18 04:00:00        98.000000\n",
+       "       2150-04-18 08:00:00        97.400000\n",
+       "       2150-04-18 11:18:00        96.300000\n",
+       "...                                     ...\n",
+       "199998 2119-02-21 02:00:00       100.400000\n",
+       "       2119-02-21 03:00:00       100.220003\n",
+       "       2119-02-21 04:00:00        99.860002\n",
+       "       2119-02-21 05:00:00       100.220003\n",
+       "       2119-02-21 06:00:00       100.400000\n",
+       "       2119-02-21 07:00:00       100.400000\n",
+       "       2119-02-21 08:00:00       100.400000\n",
+       "199999 2136-04-06 16:07:00        97.800000\n",
+       "       2136-04-06 20:00:00        97.500000\n",
+       "       2136-04-07 00:00:00        97.400000\n",
+       "       2136-04-07 02:00:00       101.000000\n",
+       "       2136-04-07 05:00:00       100.500000\n",
+       "       2136-04-07 08:00:00        99.000000\n",
+       "       2136-04-07 12:00:00        99.800000\n",
+       "       2136-04-07 15:00:00       100.700000\n",
+       "       2136-04-07 18:00:00        97.600000\n",
+       "       2136-04-07 22:00:00        98.600000\n",
+       "       2136-04-08 04:00:00        98.500000\n",
+       "       2136-04-08 09:00:00        97.800000\n",
+       "       2136-04-08 16:00:00        97.700000\n",
+       "       2136-04-08 20:00:00        99.000000\n",
+       "       2136-04-09 00:00:00        99.600000\n",
+       "       2136-04-09 05:00:00        99.100000\n",
+       "       2136-04-09 08:00:00        97.800000\n",
+       "       2136-04-09 12:00:00        98.300000\n",
+       "       2136-04-09 16:00:00        98.000000\n",
+       "       2136-04-09 20:00:00        97.400000\n",
+       "       2136-04-10 00:00:00        97.400000\n",
+       "       2136-04-10 03:00:00        97.400000\n",
+       "       2136-04-10 08:00:00        98.100000\n",
+       "\n",
+       "[1731503 rows x 1 columns]"
+      ]
+     },
+     "execution_count": 28,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_combined"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Segmenting"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 29,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import segmenting"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 30,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "df_context = utils.open_df('data/mimic_data','context')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 31,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>pt_id</th>\n",
+       "      <th>id</th>\n",
+       "      <th>start_dt</th>\n",
+       "      <th>end_dt</th>\n",
+       "      <th>lang</th>\n",
+       "      <th>religion</th>\n",
+       "      <th>marital_status</th>\n",
+       "      <th>ethnicity</th>\n",
+       "      <th>dx_info</th>\n",
+       "      <th>admission_location</th>\n",
+       "      <th>...</th>\n",
+       "      <th>dod</th>\n",
+       "      <th>icd_codes</th>\n",
+       "      <th>age</th>\n",
+       "      <th>icustay_id</th>\n",
+       "      <th>dbsource</th>\n",
+       "      <th>first_icu</th>\n",
+       "      <th>last_icu</th>\n",
+       "      <th>intime</th>\n",
+       "      <th>outtime</th>\n",
+       "      <th>los</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>87</td>\n",
+       "      <td>190659</td>\n",
+       "      <td>2191-02-25 20:30:00</td>\n",
+       "      <td>2191-04-25 15:18:00</td>\n",
+       "      <td></td>\n",
+       "      <td>UNOBTAINABLE</td>\n",
+       "      <td></td>\n",
+       "      <td>UNKNOWN/NOT SPECIFIED</td>\n",
+       "      <td>NEWBORN</td>\n",
+       "      <td>PHYS REFERRAL/NORMAL DELI</td>\n",
+       "      <td>...</td>\n",
+       "      <td>None</td>\n",
+       "      <td>[V3101, 76515, 76524, 769, 7707, 7775, 7742, 7...</td>\n",
+       "      <td>0 days 20:30:00</td>\n",
+       "      <td>277633.0</td>\n",
+       "      <td>carevue</td>\n",
+       "      <td>NICU</td>\n",
+       "      <td>NICU</td>\n",
+       "      <td>2191-02-25 21:09:05</td>\n",
+       "      <td>2191-04-25 15:38:56</td>\n",
+       "      <td>58.7707</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>88</td>\n",
+       "      <td>123010</td>\n",
+       "      <td>2111-08-29 03:03:00</td>\n",
+       "      <td>2111-09-03 14:24:00</td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td></td>\n",
+       "      <td>BLACK/AFRICAN AMERICAN</td>\n",
+       "      <td>S/P MOTOR VEHICLE ACCIDENT-STABBING</td>\n",
+       "      <td>EMERGENCY ROOM ADMIT</td>\n",
+       "      <td>...</td>\n",
+       "      <td>None</td>\n",
+       "      <td>[86113, 5119, 4239, E966]</td>\n",
+       "      <td>10467 days 03:03:00</td>\n",
+       "      <td>297289.0</td>\n",
+       "      <td>carevue</td>\n",
+       "      <td>TSICU</td>\n",
+       "      <td>TSICU</td>\n",
+       "      <td>2111-08-29 03:04:42</td>\n",
+       "      <td>2111-08-30 21:08:09</td>\n",
+       "      <td>1.7524</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>89</td>\n",
+       "      <td>188646</td>\n",
+       "      <td>2185-06-17 05:22:00</td>\n",
+       "      <td>2185-06-21 11:15:00</td>\n",
+       "      <td></td>\n",
+       "      <td>UNOBTAINABLE</td>\n",
+       "      <td></td>\n",
+       "      <td>UNKNOWN/NOT SPECIFIED</td>\n",
+       "      <td>NEWBORN</td>\n",
+       "      <td>PHYS REFERRAL/NORMAL DELI</td>\n",
+       "      <td>...</td>\n",
+       "      <td>None</td>\n",
+       "      <td>[V3101, 7742, 76516, 76527, 22801, V290]</td>\n",
+       "      <td>0 days 05:22:00</td>\n",
+       "      <td>249786.0</td>\n",
+       "      <td>carevue</td>\n",
+       "      <td>NICU</td>\n",
+       "      <td>NICU</td>\n",
+       "      <td>2185-06-17 05:46:00</td>\n",
+       "      <td>2185-06-21 12:00:41</td>\n",
+       "      <td>4.2602</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>91</td>\n",
+       "      <td>121205</td>\n",
+       "      <td>2177-04-23 00:08:00</td>\n",
+       "      <td>2177-05-10 15:16:00</td>\n",
+       "      <td></td>\n",
+       "      <td>JEWISH</td>\n",
+       "      <td>MARRIED</td>\n",
+       "      <td>WHITE</td>\n",
+       "      <td>FEVER</td>\n",
+       "      <td>EMERGENCY ROOM ADMIT</td>\n",
+       "      <td>...</td>\n",
+       "      <td>2177-05-10 00:00:00</td>\n",
+       "      <td>[20008, 2765, 5559, 99812, 51881, 4470, 135, 5...</td>\n",
+       "      <td>29794 days 00:08:00</td>\n",
+       "      <td>218528.0</td>\n",
+       "      <td>carevue</td>\n",
+       "      <td>CSRU</td>\n",
+       "      <td>CSRU</td>\n",
+       "      <td>2177-04-27 02:08:00</td>\n",
+       "      <td>2177-04-27 14:03:00</td>\n",
+       "      <td>0.4965</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>91</td>\n",
+       "      <td>121205</td>\n",
+       "      <td>2177-04-23 00:08:00</td>\n",
+       "      <td>2177-05-10 15:16:00</td>\n",
+       "      <td></td>\n",
+       "      <td>JEWISH</td>\n",
+       "      <td>MARRIED</td>\n",
+       "      <td>WHITE</td>\n",
+       "      <td>FEVER</td>\n",
+       "      <td>EMERGENCY ROOM ADMIT</td>\n",
+       "      <td>...</td>\n",
+       "      <td>2177-05-10 00:00:00</td>\n",
+       "      <td>[20008, 2765, 5559, 99812, 51881, 4470, 135, 5...</td>\n",
+       "      <td>29794 days 00:08:00</td>\n",
+       "      <td>256972.0</td>\n",
+       "      <td>carevue</td>\n",
+       "      <td>MICU</td>\n",
+       "      <td>MICU</td>\n",
+       "      <td>2177-05-07 03:52:00</td>\n",
+       "      <td>2177-05-10 15:16:00</td>\n",
+       "      <td>3.4750</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>5 rows × 22 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   pt_id      id            start_dt              end_dt lang      religion  \\\n",
+       "0     87  190659 2191-02-25 20:30:00 2191-04-25 15:18:00       UNOBTAINABLE   \n",
+       "1     88  123010 2111-08-29 03:03:00 2111-09-03 14:24:00                      \n",
+       "2     89  188646 2185-06-17 05:22:00 2185-06-21 11:15:00       UNOBTAINABLE   \n",
+       "3     91  121205 2177-04-23 00:08:00 2177-05-10 15:16:00             JEWISH   \n",
+       "4     91  121205 2177-04-23 00:08:00 2177-05-10 15:16:00             JEWISH   \n",
+       "\n",
+       "  marital_status               ethnicity                              dx_info  \\\n",
+       "0                  UNKNOWN/NOT SPECIFIED                              NEWBORN   \n",
+       "1                 BLACK/AFRICAN AMERICAN  S/P MOTOR VEHICLE ACCIDENT-STABBING   \n",
+       "2                  UNKNOWN/NOT SPECIFIED                              NEWBORN   \n",
+       "3        MARRIED                   WHITE                                FEVER   \n",
+       "4        MARRIED                   WHITE                                FEVER   \n",
+       "\n",
+       "          admission_location   ...                     dod  \\\n",
+       "0  PHYS REFERRAL/NORMAL DELI   ...                    None   \n",
+       "1       EMERGENCY ROOM ADMIT   ...                    None   \n",
+       "2  PHYS REFERRAL/NORMAL DELI   ...                    None   \n",
+       "3       EMERGENCY ROOM ADMIT   ...     2177-05-10 00:00:00   \n",
+       "4       EMERGENCY ROOM ADMIT   ...     2177-05-10 00:00:00   \n",
+       "\n",
+       "                                           icd_codes                 age  \\\n",
+       "0  [V3101, 76515, 76524, 769, 7707, 7775, 7742, 7...     0 days 20:30:00   \n",
+       "1                          [86113, 5119, 4239, E966] 10467 days 03:03:00   \n",
+       "2           [V3101, 7742, 76516, 76527, 22801, V290]     0 days 05:22:00   \n",
+       "3  [20008, 2765, 5559, 99812, 51881, 4470, 135, 5... 29794 days 00:08:00   \n",
+       "4  [20008, 2765, 5559, 99812, 51881, 4470, 135, 5... 29794 days 00:08:00   \n",
+       "\n",
+       "  icustay_id  dbsource  first_icu last_icu              intime  \\\n",
+       "0   277633.0   carevue       NICU     NICU 2191-02-25 21:09:05   \n",
+       "1   297289.0   carevue      TSICU    TSICU 2111-08-29 03:04:42   \n",
+       "2   249786.0   carevue       NICU     NICU 2185-06-17 05:46:00   \n",
+       "3   218528.0   carevue       CSRU     CSRU 2177-04-27 02:08:00   \n",
+       "4   256972.0   carevue       MICU     MICU 2177-05-07 03:52:00   \n",
+       "\n",
+       "              outtime      los  \n",
+       "0 2191-04-25 15:38:56  58.7707  \n",
+       "1 2111-08-30 21:08:09   1.7524  \n",
+       "2 2185-06-21 12:00:41   4.2602  \n",
+       "3 2177-04-27 14:03:00   0.4965  \n",
+       "4 2177-05-10 15:16:00   3.4750  \n",
+       "\n",
+       "[5 rows x 22 columns]"
+      ]
+     },
+     "execution_count": 31,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_context.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 33,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "\n",
+    "# Draw one random row per `id` from the combined temperature series; the datetime of the\n",
+    "# sampled row becomes that id's entry in end_dt.\n",
+    "# A single seeded RandomState is shared by all groups so that Restart & Run All reproduces the\n",
+    "# same draws, without every equally sized group picking the same row position (which a plain\n",
+    "# integer seed per call would do).\n",
+    "sample_rng = np.random.RandomState(0)\n",
+    "end_dt = df_temp_combined.iloc[:,0].groupby(level='id').apply(lambda x:x.sample(1, random_state=sample_rng))\n",
+    "# Drop the outermost index level (the group key added by apply), then move `datetime` out of the\n",
+    "# index into the first column and keep only that column.\n",
+    "end_dt = end_dt.reset_index(level=0,drop=True).reset_index(level=1,drop=False).iloc[:,0]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 34,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "# `reload` is a builtin only on Python 2; fall back to importlib on Python 3.4+ so this cell\n",
+    "# runs on either interpreter.\n",
+    "try:\n",
+    "    reload\n",
+    "except NameError:\n",
+    "    from importlib import reload\n",
+    "\n",
+    "# Re-import the local modules so that edits made since their first import take effect in this kernel.\n",
+    "reload(segmenting)\n",
+    "reload(utils)\n",
+    "\n",
+    "# Construct three segmenting objects from the sampled end_dt and the context frame.\n",
+    "# NOTE(review): the unit of the literal 10 is not visible from this cell (presumably hours for\n",
+    "# n_hrs_before, judging by its name) - confirm against segmenting.py before changing it.\n",
+    "all_before = segmenting.all_before(end_dt,df_context)\n",
+    "n_hrs_before = segmenting.n_hrs_before(end_dt,10)\n",
+    "periodic = segmenting.periodic(10,df_context)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 138,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "C:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\tools\\merge.py:480: UserWarning: merging between different levels can give an unintended result (3 levels on the left, 1 on the right)\n",
+      "  warnings.warn(msg, UserWarning)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degF</th>\n",
+       "      <th colspan=\"2\" halign=\"left\">degC</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762</th>\n",
+       "      <th>676</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>seg_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"8\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100003</th>\n",
+       "      <th>2150-04-17 20:31:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>95.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-17 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"19\" valign=\"top\">100006</th>\n",
+       "      <th>2108-04-06 16:30:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-06 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-07 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-07 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-07 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-07 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-07 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.599998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 16:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-08 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-09 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-09 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-09 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-09 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-09 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.599998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2108-04-10 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"10\" valign=\"top\">199998</th>\n",
+       "      <th>2119-02-20 17:15:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.299999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 17:30:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 17:45:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.599998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 18:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.900002</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 18:30:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.200001</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 19:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.599998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.799999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 21:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.799999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.799999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2119-02-20 23:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.700001</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"20\" valign=\"top\">199999</th>\n",
+       "      <th>2136-04-06 16:07:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-06 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 02:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>101.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 05:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 15:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 18:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-07 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 09:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 16:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-08 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 05:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 12:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 16:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2136-04-09 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>839877 rows × 4 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                             temperature body                    \\\n",
+       "units                                         degF              degC   \n",
+       "description                                 223761     678    223762   \n",
+       "id     datetime            seg_id                                      \n",
+       "100001 2117-09-11 13:48:00 0                  98.0        NaN    NaN   \n",
+       "       2117-09-11 16:00:00 0                  97.9        NaN    NaN   \n",
+       "       2117-09-11 19:00:00 0                  99.5        NaN    NaN   \n",
+       "       2117-09-11 22:00:00 0                 100.0        NaN    NaN   \n",
+       "       2117-09-12 01:00:00 0                  99.9        NaN    NaN   \n",
+       "       2117-09-12 04:00:00 0                  97.7        NaN    NaN   \n",
+       "       2117-09-12 08:00:00 0                  97.8        NaN    NaN   \n",
+       "       2117-09-12 12:00:00 0                  97.5        NaN    NaN   \n",
+       "100003 2150-04-17 20:31:00 0                  95.9        NaN    NaN   \n",
+       "       2150-04-17 22:00:00 0                  98.2        NaN    NaN   \n",
+       "       2150-04-18 00:00:00 0                  97.4        NaN    NaN   \n",
+       "100006 2108-04-06 16:30:00 0                   NaN  97.000000    NaN   \n",
+       "       2108-04-06 20:00:00 0                   NaN  97.400002    NaN   \n",
+       "       2108-04-07 00:00:00 0                   NaN  97.800003    NaN   \n",
+       "       2108-04-07 04:00:00 0                   NaN  97.000000    NaN   \n",
+       "       2108-04-07 08:00:00 0                   NaN  97.099998    NaN   \n",
+       "       2108-04-07 12:00:00 0                   NaN  97.000000    NaN   \n",
+       "       2108-04-07 20:00:00 0                   NaN  98.800003    NaN   \n",
+       "       2108-04-08 00:00:00 0                   NaN  98.599998    NaN   \n",
+       "       2108-04-08 04:00:00 0                   NaN  98.000000    NaN   \n",
+       "       2108-04-08 08:00:00 0                   NaN  97.199997    NaN   \n",
+       "       2108-04-08 12:00:00 0                   NaN  97.000000    NaN   \n",
+       "       2108-04-08 16:00:00 0                   NaN  98.000000    NaN   \n",
+       "       2108-04-08 20:00:00 0                   NaN  98.800003    NaN   \n",
+       "       2108-04-09 00:00:00 0                   NaN  97.199997    NaN   \n",
+       "       2108-04-09 04:00:00 0                   NaN  97.400002    NaN   \n",
+       "       2108-04-09 08:00:00 0                   NaN  97.099998    NaN   \n",
+       "       2108-04-09 12:00:00 0                   NaN  97.300003    NaN   \n",
+       "       2108-04-09 20:00:00 0                   NaN  97.599998    NaN   \n",
+       "       2108-04-10 00:00:00 0                   NaN  97.000000    NaN   \n",
+       "...                                            ...        ...    ...   \n",
+       "199998 2119-02-20 17:15:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 17:30:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 17:45:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 18:00:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 18:30:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 19:00:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 20:00:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 21:00:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 22:00:00 0                   NaN        NaN    NaN   \n",
+       "       2119-02-20 23:00:00 0                   NaN        NaN    NaN   \n",
+       "199999 2136-04-06 16:07:00 0                  97.8        NaN    NaN   \n",
+       "       2136-04-06 20:00:00 0                  97.5        NaN    NaN   \n",
+       "       2136-04-07 00:00:00 0                  97.4        NaN    NaN   \n",
+       "       2136-04-07 02:00:00 0                 101.0        NaN    NaN   \n",
+       "       2136-04-07 05:00:00 0                 100.5        NaN    NaN   \n",
+       "       2136-04-07 08:00:00 0                  99.0        NaN    NaN   \n",
+       "       2136-04-07 12:00:00 0                  99.8        NaN    NaN   \n",
+       "       2136-04-07 15:00:00 0                 100.7        NaN    NaN   \n",
+       "       2136-04-07 18:00:00 0                  97.6        NaN    NaN   \n",
+       "       2136-04-07 22:00:00 0                  98.6        NaN    NaN   \n",
+       "       2136-04-08 04:00:00 0                  98.5        NaN    NaN   \n",
+       "       2136-04-08 09:00:00 0                  97.8        NaN    NaN   \n",
+       "       2136-04-08 16:00:00 0                  97.7        NaN    NaN   \n",
+       "       2136-04-08 20:00:00 0                  99.0        NaN    NaN   \n",
+       "       2136-04-09 00:00:00 0                  99.6        NaN    NaN   \n",
+       "       2136-04-09 05:00:00 0                  99.1        NaN    NaN   \n",
+       "       2136-04-09 08:00:00 0                  97.8        NaN    NaN   \n",
+       "       2136-04-09 12:00:00 0                  98.3        NaN    NaN   \n",
+       "       2136-04-09 16:00:00 0                  98.0        NaN    NaN   \n",
+       "       2136-04-09 20:00:00 0                  97.4        NaN    NaN   \n",
+       "\n",
+       "label                                         \n",
+       "units                                         \n",
+       "description                           676     \n",
+       "id     datetime            seg_id             \n",
+       "100001 2117-09-11 13:48:00 0             NaN  \n",
+       "       2117-09-11 16:00:00 0             NaN  \n",
+       "       2117-09-11 19:00:00 0             NaN  \n",
+       "       2117-09-11 22:00:00 0             NaN  \n",
+       "       2117-09-12 01:00:00 0             NaN  \n",
+       "       2117-09-12 04:00:00 0             NaN  \n",
+       "       2117-09-12 08:00:00 0             NaN  \n",
+       "       2117-09-12 12:00:00 0             NaN  \n",
+       "100003 2150-04-17 20:31:00 0             NaN  \n",
+       "       2150-04-17 22:00:00 0             NaN  \n",
+       "       2150-04-18 00:00:00 0             NaN  \n",
+       "100006 2108-04-06 16:30:00 0             NaN  \n",
+       "       2108-04-06 20:00:00 0             NaN  \n",
+       "       2108-04-07 00:00:00 0             NaN  \n",
+       "       2108-04-07 04:00:00 0             NaN  \n",
+       "       2108-04-07 08:00:00 0             NaN  \n",
+       "       2108-04-07 12:00:00 0             NaN  \n",
+       "       2108-04-07 20:00:00 0             NaN  \n",
+       "       2108-04-08 00:00:00 0             NaN  \n",
+       "       2108-04-08 04:00:00 0             NaN  \n",
+       "       2108-04-08 08:00:00 0             NaN  \n",
+       "       2108-04-08 12:00:00 0             NaN  \n",
+       "       2108-04-08 16:00:00 0             NaN  \n",
+       "       2108-04-08 20:00:00 0             NaN  \n",
+       "       2108-04-09 00:00:00 0             NaN  \n",
+       "       2108-04-09 04:00:00 0             NaN  \n",
+       "       2108-04-09 08:00:00 0             NaN  \n",
+       "       2108-04-09 12:00:00 0             NaN  \n",
+       "       2108-04-09 20:00:00 0             NaN  \n",
+       "       2108-04-10 00:00:00 0             NaN  \n",
+       "...                                      ...  \n",
+       "199998 2119-02-20 17:15:00 0       36.299999  \n",
+       "       2119-02-20 17:30:00 0       36.500000  \n",
+       "       2119-02-20 17:45:00 0       36.599998  \n",
+       "       2119-02-20 18:00:00 0       36.900002  \n",
+       "       2119-02-20 18:30:00 0       37.200001  \n",
+       "       2119-02-20 19:00:00 0       37.599998  \n",
+       "       2119-02-20 20:00:00 0       37.799999  \n",
+       "       2119-02-20 21:00:00 0       37.799999  \n",
+       "       2119-02-20 22:00:00 0       37.799999  \n",
+       "       2119-02-20 23:00:00 0       37.700001  \n",
+       "199999 2136-04-06 16:07:00 0             NaN  \n",
+       "       2136-04-06 20:00:00 0             NaN  \n",
+       "       2136-04-07 00:00:00 0             NaN  \n",
+       "       2136-04-07 02:00:00 0             NaN  \n",
+       "       2136-04-07 05:00:00 0             NaN  \n",
+       "       2136-04-07 08:00:00 0             NaN  \n",
+       "       2136-04-07 12:00:00 0             NaN  \n",
+       "       2136-04-07 15:00:00 0             NaN  \n",
+       "       2136-04-07 18:00:00 0             NaN  \n",
+       "       2136-04-07 22:00:00 0             NaN  \n",
+       "       2136-04-08 04:00:00 0             NaN  \n",
+       "       2136-04-08 09:00:00 0             NaN  \n",
+       "       2136-04-08 16:00:00 0             NaN  \n",
+       "       2136-04-08 20:00:00 0             NaN  \n",
+       "       2136-04-09 00:00:00 0             NaN  \n",
+       "       2136-04-09 05:00:00 0             NaN  \n",
+       "       2136-04-09 08:00:00 0             NaN  \n",
+       "       2136-04-09 12:00:00 0             NaN  \n",
+       "       2136-04-09 16:00:00 0             NaN  \n",
+       "       2136-04-09 20:00:00 0             NaN  \n",
+       "\n",
+       "[839877 rows x 4 columns]"
+      ]
+     },
+     "execution_count": 138,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_temp_all_before = all_before.transform(df_temp_cl)  # result is indexed by a 'seg_id' level, filtered on below\n",
+    "df_temp_all_before.loc[df_temp_all_before.index.get_level_values('seg_id') > -1]  # display only rows with seg_id > -1"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 262,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "                            seg_id\n",
+      "id     datetime                   \n",
+      "100001 2117-09-11 22:00:00       0\n",
+      "       2117-09-12 01:00:00       0\n",
+      "       2117-09-12 04:00:00       0\n",
+      "100006 2108-04-07 20:00:00       0\n",
+      "100007 2145-04-04 00:00:00       0\n",
+      "       2145-04-04 04:00:00       0\n",
+      "100009 2162-05-19 03:00:00       0\n",
+      "100010 2109-12-10 22:47:00       0\n",
+      "       2109-12-11 00:00:00       0\n",
+      "100011 2177-09-07 09:00:00       0\n",
+      "       2177-09-07 13:00:00       0\n",
+      "       2177-09-07 17:00:00       0\n",
+      "label                             temperature body                           \n",
+      "status                                       known                           \n",
+      "variable_type                                   qn                           \n",
+      "units                                         degF                           \n",
+      "description                                 223761 678 223762(degC) 676(degC)\n",
+      "id     datetime            seg_id                                            \n",
+      "100001 2117-09-11 13:48:00 -1                 98.0 NaN          NaN       NaN\n",
+      "       2117-09-11 16:00:00 -1                 97.9 NaN          NaN       NaN\n",
+      "       2117-09-11 19:00:00 -1                 99.5 NaN          NaN       NaN\n",
+      "       2117-09-11 22:00:00  0                100.0 NaN          NaN       NaN\n",
+      "       2117-09-12 01:00:00  0                 99.9 NaN          NaN       NaN\n",
+      "       2117-09-12 04:00:00  0                 97.7 NaN          NaN       NaN\n",
+      "       2117-09-12 08:00:00 -1                 97.8 NaN          NaN       NaN\n",
+      "       2117-09-12 12:00:00 -1                 97.5 NaN          NaN       NaN\n",
+      "       2117-09-12 19:00:00 -1                 99.8 NaN          NaN       NaN\n",
+      "       2117-09-13 00:00:00 -1                 99.7 NaN          NaN       NaN\n",
+      "       2117-09-13 04:00:00 -1                 99.3 NaN          NaN       NaN\n",
+      "       2117-09-13 08:00:00 -1                 99.4 NaN          NaN       NaN\n",
+      "       2117-09-13 12:00:00 -1                 98.8 NaN          NaN       NaN\n",
+      "       2117-09-13 16:00:00 -1                 99.3 NaN          NaN       NaN\n",
+      "       2117-09-13 22:00:00 -1                 99.9 NaN          NaN       NaN\n",
+      "       2117-09-14 00:00:00 -1                 99.4 NaN          NaN       NaN\n",
+      "       2117-09-14 04:00:00 -1                 99.6 NaN          NaN       NaN\n",
+      "       2117-09-14 08:00:00 -1                 99.0 NaN          NaN       NaN\n",
+      "       2117-09-14 13:00:00 -1                 98.0 NaN          NaN       NaN\n",
+      "       2117-09-14 19:00:00 -1                 99.5 NaN          NaN       NaN\n",
+      "       2117-09-15 00:00:00 -1                 99.6 NaN          NaN       NaN\n",
+      "       2117-09-15 08:00:00 -1                 98.3 NaN          NaN       NaN\n",
+      "       2117-09-15 12:00:00 -1                 97.8 NaN          NaN       NaN\n",
+      "       2117-09-15 16:00:00 -1                 98.6 NaN          NaN       NaN\n",
+      "100003 2150-04-17 20:31:00 -1                 95.9 NaN          NaN       NaN\n",
+      "       2150-04-17 22:00:00 -1                 98.2 NaN          NaN       NaN\n",
+      "       2150-04-18 00:00:00 -1                 97.4 NaN          NaN       NaN\n",
+      "       2150-04-18 04:00:00 -1                 98.0 NaN          NaN       NaN\n",
+      "       2150-04-18 08:00:00 -1                 97.4 NaN          NaN       NaN\n",
+      "       2150-04-18 11:18:00 -1                 96.3 NaN          NaN       NaN\n",
+      "...                                            ...  ..          ...       ...\n",
+      "100011 2177-09-04 19:00:00 -1                101.0 NaN          NaN       NaN\n",
+      "       2177-09-04 20:00:00 -1                101.2 NaN          NaN       NaN\n",
+      "       2177-09-04 22:00:00 -1                102.1 NaN          NaN       NaN\n",
+      "       2177-09-05 00:00:00 -1                101.8 NaN          NaN       NaN\n",
+      "       2177-09-05 02:00:00 -1                100.8 NaN          NaN       NaN\n",
+      "       2177-09-05 04:00:00 -1                100.1 NaN          NaN       NaN\n",
+      "       2177-09-05 06:00:00 -1                100.1 NaN          NaN       NaN\n",
+      "       2177-09-05 08:00:00 -1                 99.5 NaN          NaN       NaN\n",
+      "       2177-09-05 10:00:00 -1                101.4 NaN          NaN       NaN\n",
+      "       2177-09-05 12:00:00 -1                101.1 NaN          NaN       NaN\n",
+      "       2177-09-05 14:00:00 -1                 99.8 NaN          NaN       NaN\n",
+      "       2177-09-05 16:00:00 -1                 97.5 NaN          NaN       NaN\n",
+      "       2177-09-05 20:00:00 -1                102.0 NaN          NaN       NaN\n",
+      "       2177-09-05 23:00:00 -1                100.8 NaN          NaN       NaN\n",
+      "       2177-09-06 02:00:00 -1                101.0 NaN          NaN       NaN\n",
+      "       2177-09-06 04:00:00 -1                101.2 NaN          NaN       NaN\n",
+      "       2177-09-06 08:00:00 -1                100.1 NaN          NaN       NaN\n",
+      "       2177-09-06 12:00:00 -1                100.1 NaN          NaN       NaN\n",
+      "       2177-09-06 16:00:00 -1                102.7 NaN          NaN       NaN\n",
+      "       2177-09-06 18:00:00 -1                102.0 NaN          NaN       NaN\n",
+      "       2177-09-06 20:00:00 -1                101.3 NaN          NaN       NaN\n",
+      "       2177-09-06 23:00:00 -1                101.9 NaN          NaN       NaN\n",
+      "       2177-09-07 00:00:00 -1                 99.9 NaN          NaN       NaN\n",
+      "       2177-09-07 04:00:00 -1                100.5 NaN          NaN       NaN\n",
+      "       2177-09-07 09:00:00  0                 99.5 NaN          NaN       NaN\n",
+      "       2177-09-07 13:00:00  0                 99.1 NaN          NaN       NaN\n",
+      "       2177-09-07 17:00:00  0                 99.2 NaN          NaN       NaN\n",
+      "       2177-09-07 19:00:00 -1                 99.9 NaN          NaN       NaN\n",
+      "       2177-09-08 00:00:00 -1                 99.8 NaN          NaN       NaN\n",
+      "       2177-09-08 04:00:00 -1                 99.5 NaN          NaN       NaN\n",
+      "\n",
+      "[200 rows x 4 columns]\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">degF</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762(degC)</th>\n",
+       "      <th>676(degC)</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>seg_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100006</th>\n",
+       "      <th>2108-04-07 20:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100007</th>\n",
+       "      <th>2145-04-04 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.699997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2145-04-04 04:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100009</th>\n",
+       "      <th>2162-05-19 03:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100010</th>\n",
+       "      <th>2109-12-10 22:47:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2109-12-11 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100011</th>\n",
+       "      <th>2177-09-07 09:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-09-07 13:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2177-09-07 17:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                             temperature body                          \\\n",
+       "status                                       known                           \n",
+       "variable_type                                   qn                           \n",
+       "units                                         degF                           \n",
+       "description                                 223761        678 223762(degC)   \n",
+       "id     datetime            seg_id                                            \n",
+       "100001 2117-09-11 22:00:00 0                 100.0        NaN          NaN   \n",
+       "       2117-09-12 01:00:00 0                  99.9        NaN          NaN   \n",
+       "       2117-09-12 04:00:00 0                  97.7        NaN          NaN   \n",
+       "100006 2108-04-07 20:00:00 0                   NaN  98.800003          NaN   \n",
+       "100007 2145-04-04 00:00:00 0                   NaN  98.699997          NaN   \n",
+       "       2145-04-04 04:00:00 0                   NaN  97.400002          NaN   \n",
+       "100009 2162-05-19 03:00:00 0                  98.6        NaN          NaN   \n",
+       "100010 2109-12-10 22:47:00 0                 100.2        NaN          NaN   \n",
+       "       2109-12-11 00:00:00 0                  98.8        NaN          NaN   \n",
+       "100011 2177-09-07 09:00:00 0                  99.5        NaN          NaN   \n",
+       "       2177-09-07 13:00:00 0                  99.1        NaN          NaN   \n",
+       "       2177-09-07 17:00:00 0                  99.2        NaN          NaN   \n",
+       "\n",
+       "label                                        \n",
+       "status                                       \n",
+       "variable_type                                \n",
+       "units                                        \n",
+       "description                       676(degC)  \n",
+       "id     datetime            seg_id            \n",
+       "100001 2117-09-11 22:00:00 0            NaN  \n",
+       "       2117-09-12 01:00:00 0            NaN  \n",
+       "       2117-09-12 04:00:00 0            NaN  \n",
+       "100006 2108-04-07 20:00:00 0            NaN  \n",
+       "100007 2145-04-04 00:00:00 0            NaN  \n",
+       "       2145-04-04 04:00:00 0            NaN  \n",
+       "100009 2162-05-19 03:00:00 0            NaN  \n",
+       "100010 2109-12-10 22:47:00 0            NaN  \n",
+       "       2109-12-11 00:00:00 0            NaN  \n",
+       "100011 2177-09-07 09:00:00 0            NaN  \n",
+       "       2177-09-07 13:00:00 0            NaN  \n",
+       "       2177-09-07 17:00:00 0            NaN  "
+      ]
+     },
+     "execution_count": 262,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Run n_hrs_before.transform on the first 200 rows of the combined temperature frame.\n",
+    "df_temp_Nhr_before = n_hrs_before.transform(df_temp_combined.head(200))\n",
+    "# Display only the rows whose 'seg_id' index level is greater than -1.\n",
+    "# NOTE(review): presumably -1 marks rows that fall outside every segment -- confirm in segmenting.\n",
+    "df_temp_Nhr_before.loc[df_temp_Nhr_before.index.get_level_values('seg_id') > -1]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 266,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>label</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">temperature body</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">known</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">degF</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>223761</th>\n",
+       "      <th>678</th>\n",
+       "      <th>223762(degC)</th>\n",
+       "      <th>676(degC)</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>seg_id</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"24\" valign=\"top\">100001</th>\n",
+       "      <th>2117-09-11 13:48:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 16:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 19:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-11 22:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 01:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 04:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>97.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 08:00:00</th>\n",
+       "      <th>2</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 12:00:00</th>\n",
+       "      <th>2</th>\n",
+       "      <td>97.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-12 19:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>99.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 00:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 04:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 08:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 12:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>98.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 16:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>99.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-13 22:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 00:00:00</th>\n",
+       "      <th>6</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 04:00:00</th>\n",
+       "      <th>6</th>\n",
+       "      <td>99.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 08:00:00</th>\n",
+       "      <th>6</th>\n",
+       "      <td>99.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 13:00:00</th>\n",
+       "      <th>7</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-14 19:00:00</th>\n",
+       "      <th>7</th>\n",
+       "      <td>99.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 00:00:00</th>\n",
+       "      <th>8</th>\n",
+       "      <td>99.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 08:00:00</th>\n",
+       "      <th>9</th>\n",
+       "      <td>98.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 12:00:00</th>\n",
+       "      <th>9</th>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2117-09-15 16:00:00</th>\n",
+       "      <th>10</th>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"6\" valign=\"top\">100003</th>\n",
+       "      <th>2150-04-17 20:31:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>95.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-17 22:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 00:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 04:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 08:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2150-04-18 11:18:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>96.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"16\" valign=\"top\">100114</th>\n",
+       "      <th>2157-09-19 18:15:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-19 18:30:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-19 20:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-19 23:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 00:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.599998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 01:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 01:15:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 02:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 06:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 08:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.699997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 09:15:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 09:30:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 10:00:00</th>\n",
+       "      <th>4</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 12:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 15:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2157-09-20 18:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"13\" valign=\"top\">100116</th>\n",
+       "      <th>2173-07-27 05:13:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 08:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 09:30:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 11:00:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>98.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 14:25:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>100.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 16:30:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>100.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 18:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>99.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-27 20:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>100.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-28 00:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-28 04:00:00</th>\n",
+       "      <th>2</th>\n",
+       "      <td>98.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-28 08:00:00</th>\n",
+       "      <th>2</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-28 12:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>98.5</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2173-07-28 16:00:00</th>\n",
+       "      <th>3</th>\n",
+       "      <td>99.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>100117</th>\n",
+       "      <th>2166-04-30 21:39:00</th>\n",
+       "      <th>0</th>\n",
+       "      <td>99.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>2000 rows × 4 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "label                             temperature body                          \\\n",
+       "status                                       known                           \n",
+       "variable_type                                   qn                           \n",
+       "units                                         degF                           \n",
+       "description                                 223761        678 223762(degC)   \n",
+       "id     datetime            seg_id                                            \n",
+       "100001 2117-09-11 13:48:00 0                  98.0        NaN          NaN   \n",
+       "       2117-09-11 16:00:00 0                  97.9        NaN          NaN   \n",
+       "       2117-09-11 19:00:00 0                  99.5        NaN          NaN   \n",
+       "       2117-09-11 22:00:00 1                 100.0        NaN          NaN   \n",
+       "       2117-09-12 01:00:00 1                  99.9        NaN          NaN   \n",
+       "       2117-09-12 04:00:00 1                  97.7        NaN          NaN   \n",
+       "       2117-09-12 08:00:00 2                  97.8        NaN          NaN   \n",
+       "       2117-09-12 12:00:00 2                  97.5        NaN          NaN   \n",
+       "       2117-09-12 19:00:00 3                  99.8        NaN          NaN   \n",
+       "       2117-09-13 00:00:00 3                  99.7        NaN          NaN   \n",
+       "       2117-09-13 04:00:00 4                  99.3        NaN          NaN   \n",
+       "       2117-09-13 08:00:00 4                  99.4        NaN          NaN   \n",
+       "       2117-09-13 12:00:00 4                  98.8        NaN          NaN   \n",
+       "       2117-09-13 16:00:00 5                  99.3        NaN          NaN   \n",
+       "       2117-09-13 22:00:00 5                  99.9        NaN          NaN   \n",
+       "       2117-09-14 00:00:00 6                  99.4        NaN          NaN   \n",
+       "       2117-09-14 04:00:00 6                  99.6        NaN          NaN   \n",
+       "       2117-09-14 08:00:00 6                  99.0        NaN          NaN   \n",
+       "       2117-09-14 13:00:00 7                  98.0        NaN          NaN   \n",
+       "       2117-09-14 19:00:00 7                  99.5        NaN          NaN   \n",
+       "       2117-09-15 00:00:00 8                  99.6        NaN          NaN   \n",
+       "       2117-09-15 08:00:00 9                  98.3        NaN          NaN   \n",
+       "       2117-09-15 12:00:00 9                  97.8        NaN          NaN   \n",
+       "       2117-09-15 16:00:00 10                 98.6        NaN          NaN   \n",
+       "100003 2150-04-17 20:31:00 0                  95.9        NaN          NaN   \n",
+       "       2150-04-17 22:00:00 0                  98.2        NaN          NaN   \n",
+       "       2150-04-18 00:00:00 0                  97.4        NaN          NaN   \n",
+       "       2150-04-18 04:00:00 1                  98.0        NaN          NaN   \n",
+       "       2150-04-18 08:00:00 1                  97.4        NaN          NaN   \n",
+       "       2150-04-18 11:18:00 1                  96.3        NaN          NaN   \n",
+       "...                                            ...        ...          ...   \n",
+       "100114 2157-09-19 18:15:00 3                   NaN  98.400002          NaN   \n",
+       "       2157-09-19 18:30:00 3                   NaN  98.300003          NaN   \n",
+       "       2157-09-19 20:00:00 3                   NaN  98.400002          NaN   \n",
+       "       2157-09-19 23:00:00 3                   NaN  98.400002          NaN   \n",
+       "       2157-09-20 00:00:00 3                   NaN  98.599998          NaN   \n",
+       "       2157-09-20 01:00:00 3                   NaN  98.000000          NaN   \n",
+       "       2157-09-20 01:15:00 4                   NaN  98.199997          NaN   \n",
+       "       2157-09-20 02:00:00 4                   NaN  97.099998          NaN   \n",
+       "       2157-09-20 06:00:00 4                   NaN  98.000000          NaN   \n",
+       "       2157-09-20 08:00:00 4                   NaN  96.699997          NaN   \n",
+       "       2157-09-20 09:15:00 4                   NaN  96.900002          NaN   \n",
+       "       2157-09-20 09:30:00 4                   NaN  97.000000          NaN   \n",
+       "       2157-09-20 10:00:00 4                   NaN  96.900002          NaN   \n",
+       "       2157-09-20 12:00:00 5                   NaN  97.199997          NaN   \n",
+       "       2157-09-20 15:00:00 5                   NaN  98.400002          NaN   \n",
+       "       2157-09-20 18:00:00 5                   NaN  97.800003          NaN   \n",
+       "100116 2173-07-27 05:13:00 0                  98.9        NaN          NaN   \n",
+       "       2173-07-27 08:00:00 0                 100.0        NaN          NaN   \n",
+       "       2173-07-27 09:30:00 0                  99.7        NaN          NaN   \n",
+       "       2173-07-27 11:00:00 0                  98.7        NaN          NaN   \n",
+       "       2173-07-27 14:25:00 0                 100.4        NaN          NaN   \n",
+       "       2173-07-27 16:30:00 1                 100.3        NaN          NaN   \n",
+       "       2173-07-27 18:00:00 1                  99.9        NaN          NaN   \n",
+       "       2173-07-27 20:00:00 1                 100.3        NaN          NaN   \n",
+       "       2173-07-28 00:00:00 1                  99.7        NaN          NaN   \n",
+       "       2173-07-28 04:00:00 2                  98.5        NaN          NaN   \n",
+       "       2173-07-28 08:00:00 2                  99.4        NaN          NaN   \n",
+       "       2173-07-28 12:00:00 3                  98.5        NaN          NaN   \n",
+       "       2173-07-28 16:00:00 3                  99.4        NaN          NaN   \n",
+       "100117 2166-04-30 21:39:00 0                  99.7        NaN          NaN   \n",
+       "\n",
+       "label                                        \n",
+       "status                                       \n",
+       "variable_type                                \n",
+       "units                                        \n",
+       "description                       676(degC)  \n",
+       "id     datetime            seg_id            \n",
+       "100001 2117-09-11 13:48:00 0            NaN  \n",
+       "       2117-09-11 16:00:00 0            NaN  \n",
+       "       2117-09-11 19:00:00 0            NaN  \n",
+       "       2117-09-11 22:00:00 1            NaN  \n",
+       "       2117-09-12 01:00:00 1            NaN  \n",
+       "       2117-09-12 04:00:00 1            NaN  \n",
+       "       2117-09-12 08:00:00 2            NaN  \n",
+       "       2117-09-12 12:00:00 2            NaN  \n",
+       "       2117-09-12 19:00:00 3            NaN  \n",
+       "       2117-09-13 00:00:00 3            NaN  \n",
+       "       2117-09-13 04:00:00 4            NaN  \n",
+       "       2117-09-13 08:00:00 4            NaN  \n",
+       "       2117-09-13 12:00:00 4            NaN  \n",
+       "       2117-09-13 16:00:00 5            NaN  \n",
+       "       2117-09-13 22:00:00 5            NaN  \n",
+       "       2117-09-14 00:00:00 6            NaN  \n",
+       "       2117-09-14 04:00:00 6            NaN  \n",
+       "       2117-09-14 08:00:00 6            NaN  \n",
+       "       2117-09-14 13:00:00 7            NaN  \n",
+       "       2117-09-14 19:00:00 7            NaN  \n",
+       "       2117-09-15 00:00:00 8            NaN  \n",
+       "       2117-09-15 08:00:00 9            NaN  \n",
+       "       2117-09-15 12:00:00 9            NaN  \n",
+       "       2117-09-15 16:00:00 10           NaN  \n",
+       "100003 2150-04-17 20:31:00 0            NaN  \n",
+       "       2150-04-17 22:00:00 0            NaN  \n",
+       "       2150-04-18 00:00:00 0            NaN  \n",
+       "       2150-04-18 04:00:00 1            NaN  \n",
+       "       2150-04-18 08:00:00 1            NaN  \n",
+       "       2150-04-18 11:18:00 1            NaN  \n",
+       "...                                     ...  \n",
+       "100114 2157-09-19 18:15:00 3            NaN  \n",
+       "       2157-09-19 18:30:00 3            NaN  \n",
+       "       2157-09-19 20:00:00 3            NaN  \n",
+       "       2157-09-19 23:00:00 3            NaN  \n",
+       "       2157-09-20 00:00:00 3            NaN  \n",
+       "       2157-09-20 01:00:00 3            NaN  \n",
+       "       2157-09-20 01:15:00 4            NaN  \n",
+       "       2157-09-20 02:00:00 4            NaN  \n",
+       "       2157-09-20 06:00:00 4            NaN  \n",
+       "       2157-09-20 08:00:00 4            NaN  \n",
+       "       2157-09-20 09:15:00 4            NaN  \n",
+       "       2157-09-20 09:30:00 4            NaN  \n",
+       "       2157-09-20 10:00:00 4            NaN  \n",
+       "       2157-09-20 12:00:00 5            NaN  \n",
+       "       2157-09-20 15:00:00 5            NaN  \n",
+       "       2157-09-20 18:00:00 5            NaN  \n",
+       "100116 2173-07-27 05:13:00 0            NaN  \n",
+       "       2173-07-27 08:00:00 0            NaN  \n",
+       "       2173-07-27 09:30:00 0            NaN  \n",
+       "       2173-07-27 11:00:00 0            NaN  \n",
+       "       2173-07-27 14:25:00 0            NaN  \n",
+       "       2173-07-27 16:30:00 1            NaN  \n",
+       "       2173-07-27 18:00:00 1            NaN  \n",
+       "       2173-07-27 20:00:00 1            NaN  \n",
+       "       2173-07-28 00:00:00 1            NaN  \n",
+       "       2173-07-28 04:00:00 2            NaN  \n",
+       "       2173-07-28 08:00:00 2            NaN  \n",
+       "       2173-07-28 12:00:00 3            NaN  \n",
+       "       2173-07-28 16:00:00 3            NaN  \n",
+       "100117 2166-04-30 21:39:00 0            NaN  \n",
+       "\n",
+       "[2000 rows x 4 columns]"
+      ]
+     },
+     "execution_count": 266,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Run the periodic transformer on the first 2000 rows only.\n",
+    "periodic_input = df_temp_combined.head(2000)\n",
+    "df_temp_periodic = periodic.transform(periodic_input)\n",
+    "\n",
+    "# Display the rows whose 'seg_id' index level is greater than -1.\n",
+    "seg_ids = df_temp_periodic.index.get_level_values('seg_id')\n",
+    "df_temp_periodic[seg_ids > -1]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 252,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import utils\n",
+    "import mimic\n",
+    "import transformers\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import icu_data_defs\n",
+    "import units\n",
+    "import segmenting\n",
+    "from sklearn_pandas import DataFrameMapper\n",
+    "import constants\n",
+    "import features"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 251,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "hdf5_fname = 'data/mimic_data'\n",
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Preview only: show the first rows instead of rendering the whole frame into the notebook.\n",
+    "df_cleaned.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 249,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "\n",
+    "# Seed the draw so the randomly chosen row per id is the same on every run.\n",
+    "# A single RandomState is shared across groups so the draws are not the\n",
+    "# identical stream repeated for every id.\n",
+    "END_DT_SEED = 0\n",
+    "end_dt_rng = np.random.RandomState(END_DT_SEED)\n",
+    "\n",
+    "# Draw one row of the first column for each 'id' group.\n",
+    "end_dt = df_temp_combined.iloc[:,0].groupby(level='id').apply(lambda x:x.sample(1, random_state=end_dt_rng))\n",
+    "# Drop the outermost index level (presumably the group key that apply\n",
+    "# prepends -- TODO confirm), then move index level 1 out into a column and\n",
+    "# keep the first column of the result.\n",
+    "end_dt = end_dt.reset_index(level=0,drop=True).reset_index(level=1,drop=False).iloc[:,0]\n",
+    "all_before = segmenting.all_before(end_dt,df_context)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Feature creation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 247,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import utils\n",
+    "import transformers\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import units\n",
+    "from sklearn_pandas import DataFrameMapper\n",
+    "import constants\n",
+    "import features"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 248,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "ename": "ImportError",
+     "evalue": "cannot import name CUSTOM_FILTER",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[1;31mImportError\u001b[0m                               Traceback (most recent call last)",
+      "\u001b[1;32m<ipython-input-248-bae7a29e5c29>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mfeatures\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      2\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mutils\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      3\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0munits\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      4\u001b[0m \u001b[0mreload\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mconstants\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      5\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\features.pyc\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mbase\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mTransformerMixin\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mBaseEstimator\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      2\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mpipeline\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mFeatureUnion\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 3\u001b[1;33m \u001b[1;32mfrom\u001b[0m \u001b[0mconstants\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mcolumn_names\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mSEG_ID\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mNO_SEGMENT\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mCUSTOM_FILTER\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      4\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mnumpy\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mnp\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      5\u001b[0m \u001b[1;32mfrom\u001b[0m \u001b[0msklearn_pandas\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mDataFrameMapper\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;31mImportError\u001b[0m: cannot import name CUSTOM_FILTER"
+     ]
+    }
+   ],
+   "source": [
+    "# Reload dependencies before dependents. features does\n",
+    "# `from constants import ...` at import time, so constants has to be\n",
+    "# refreshed first; reloading features against a stale constants module\n",
+    "# raises ImportError for any name added to constants since its first import.\n",
+    "reload(constants)\n",
+    "reload(utils)\n",
+    "reload(units)\n",
+    "reload(features)\n",
+    "\n",
+    "df = df_temp_all_before\n",
+    "ureg = units.MedicalUreg()\n",
+    "\n",
+    "\n",
+    "def summable_filter(df):\n",
+    "    \"\"\"Return the columns of df that pass the volume-or-mass check, except 'weight body'.\n",
+    "\n",
+    "    Each column key is indexed as a sequence: element 0 is compared with\n",
+    "    'weight body', and element -2 (presumably the units level -- TODO\n",
+    "    confirm) is passed as a string to ureg.is_volume / ureg.is_mass.\n",
+    "    \"\"\"\n",
+    "    def is_summable(col):\n",
+    "        unit = str(col[-2])\n",
+    "        return (ureg.is_volume(unit) or ureg.is_mass(unit)) and (col[0] != 'weight body')\n",
+    "\n",
+    "    return df.loc[:,df.columns.map(is_summable)]\n",
+    "\n",
+    "\n",
+    "# (suffix, feature transformer, column selection) triples handed to\n",
+    "# features.make_mapper. ALL is referenced through the constants module so the\n",
+    "# cell does not depend on a bare name imported elsewhere in the notebook.\n",
+    "feature_tuples = [\n",
+    "    ('MEAN',features.segment_mean(),constants.ALL),\n",
+    "    ('STD',features.segment_std(),constants.ALL),\n",
+    "    ('COUNT',features.segment_count(),constants.ALL),\n",
+    "    ('LAST',features.segment_last(),constants.ALL),\n",
+    "    ('SUM',features.segment_sum(),{constants.CUSTOM_FILTER:summable_filter})\n",
+    "]\n",
+    "\n",
+    "mapped_ft = features.make_mapper(feature_tuples,df)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 232,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "feature_df = mapped_ft.transform(df)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 233,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>temperature body_degF_223761_MEAN</th>\n",
+       "      <th>temperature body_degF_678_MEAN</th>\n",
+       "      <th>temperature body_degC_223762_MEAN</th>\n",
+       "      <th>temperature body_degC_676_MEAN</th>\n",
+       "      <th>temperature body_degF_223761_STD</th>\n",
+       "      <th>temperature body_degF_678_STD</th>\n",
+       "      <th>temperature body_degC_223762_STD</th>\n",
+       "      <th>temperature body_degC_676_STD</th>\n",
+       "      <th>temperature body_degF_223761_COUNT</th>\n",
+       "      <th>temperature body_degF_678_COUNT</th>\n",
+       "      <th>temperature body_degC_223762_COUNT</th>\n",
+       "      <th>temperature body_degC_676_COUNT</th>\n",
+       "      <th>temperature body_degF_223761_LAST</th>\n",
+       "      <th>temperature body_degF_678_LAST</th>\n",
+       "      <th>temperature body_degC_223762_LAST</th>\n",
+       "      <th>temperature body_degC_676_LAST</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>98.537500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.064945</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>8.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>97.166667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.167619</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>95.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.533334</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.607729</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>21.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.591667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.466263</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>12.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.699997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>98.100000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.458258</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>98.550000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.036822</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>6.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.2</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>98.380000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.511765</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.641872</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.790767</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>34.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.5</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.649998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.777816</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>101.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>97.975000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.875032</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>12.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>97.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>96.050000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.777817</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>96.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.536364</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.492489</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>11.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.378571</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.260705</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>14.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.6</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>99.466667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.495650</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>12.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.766037</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.374646</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>106.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.599998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>15</th>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.141421</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>16</th>\n",
+       "      <td>100.772222</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.719512</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.075287</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.281265</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>18.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>41.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.5</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>17</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.193750</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.401560</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>32.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.799999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>18</th>\n",
+       "      <td>99.345455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.864975</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>33.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>19</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>20</th>\n",
+       "      <td>98.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.022986</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>16.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>97.6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>21</th>\n",
+       "      <td>97.760000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.585662</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>22</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.445455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.849254</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>22.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>23</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.990909</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.190574</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>11.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>28.4</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>24</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.799999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.799999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.320000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.277491</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>26</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.700000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.754119</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>24.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>27</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.787487</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>10.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>28</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.847368</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.300681</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>19.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.200001</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>29</th>\n",
+       "      <td>96.525000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>96.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44216</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.302703</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.021739</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.047082</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.997311</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>37.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>46.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44217</th>\n",
+       "      <td>98.475000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.081280</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>4.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>97.1</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44218</th>\n",
+       "      <td>96.275000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.420034</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>8.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>96.3</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44219</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44220</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.740001</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.021275</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44221</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.672309</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44222</th>\n",
+       "      <td>99.240000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.512835</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>99.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44223</th>\n",
+       "      <td>98.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.070711</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44224</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.130000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.531351</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>10.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44225</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.199997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>4.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44226</th>\n",
+       "      <td>99.753333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.765195</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>15.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.7</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44227</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.071875</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.449181</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.944674</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.920982</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>32.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>61.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44228</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.526316</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.175605</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>19.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44229</th>\n",
+       "      <td>97.580000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.740570</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>10.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>96.9</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44230</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.443518</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.332443</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>108.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.299999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44231</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.071429</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.239964</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>14.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>35.599998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44232</th>\n",
+       "      <td>98.484375</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.070456</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>32.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>100.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44233</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.278462</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.300803</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>130.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44234</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.173333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.688131</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>15.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>35.0</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44235</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.074999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.056330</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>4.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.599998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44236</th>\n",
+       "      <td>97.977778</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.032930</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>9.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>98.4</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44237</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.485713</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.977118</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>7.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44238</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.264285</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.759157</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>14.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.599998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44239</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.565688</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.000000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44240</th>\n",
+       "      <td>95.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.8</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44241</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.670000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>37.420725</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.668415</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.378023</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>10.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>193.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.699997</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44242</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.980953</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.933605</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>21.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44243</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>35.750000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>0.919241</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>35.099998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44244</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>36.176191</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.159700</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>21.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>34.700001</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44245</th>\n",
+       "      <td>98.655000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>1.147297</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>20.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>97.8</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>44246 rows × 16 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       temperature body_degF_223761_MEAN  temperature body_degF_678_MEAN  \\\n",
+       "0                              98.537500                             NaN   \n",
+       "1                              97.166667                             NaN   \n",
+       "2                                    NaN                       97.533334   \n",
+       "3                                    NaN                       98.591667   \n",
+       "4                              98.100000                             NaN   \n",
+       "5                              98.550000                             NaN   \n",
+       "6                              98.380000                             NaN   \n",
+       "7                                    NaN                      100.649998   \n",
+       "8                              97.975000                             NaN   \n",
+       "9                              96.050000                             NaN   \n",
+       "10                                   NaN                       98.536364   \n",
+       "11                                   NaN                             NaN   \n",
+       "12                             99.466667                             NaN   \n",
+       "13                                   NaN                       99.099998   \n",
+       "14                                   NaN                       95.300003   \n",
+       "15                             98.500000                             NaN   \n",
+       "16                            100.772222                             NaN   \n",
+       "17                                   NaN                             NaN   \n",
+       "18                             99.345455                             NaN   \n",
+       "19                                   NaN                       98.800003   \n",
+       "20                             98.312500                             NaN   \n",
+       "21                             97.760000                             NaN   \n",
+       "22                                   NaN                       98.445455   \n",
+       "23                                   NaN                             NaN   \n",
+       "24                                   NaN                             NaN   \n",
+       "25                                   NaN                       97.320000   \n",
+       "26                                   NaN                       96.700000   \n",
+       "27                                   NaN                       96.920000   \n",
+       "28                                   NaN                             NaN   \n",
+       "29                             96.525000                             NaN   \n",
+       "...                                  ...                             ...   \n",
+       "44216                                NaN                       98.302703   \n",
+       "44217                          98.475000                             NaN   \n",
+       "44218                          96.275000                             NaN   \n",
+       "44219                                NaN                       97.800003   \n",
+       "44220                                NaN                       95.740001   \n",
+       "44221                                NaN                       97.920000   \n",
+       "44222                          99.240000                             NaN   \n",
+       "44223                          98.450000                             NaN   \n",
+       "44224                                NaN                       98.130000   \n",
+       "44225                                NaN                       97.900002   \n",
+       "44226                          99.753333                             NaN   \n",
+       "44227                                NaN                       98.071875   \n",
+       "44228                                NaN                      100.526316   \n",
+       "44229                          97.580000                             NaN   \n",
+       "44230                                NaN                             NaN   \n",
+       "44231                                NaN                             NaN   \n",
+       "44232                          98.484375                             NaN   \n",
+       "44233                                NaN                      100.278462   \n",
+       "44234                                NaN                             NaN   \n",
+       "44235                                NaN                       97.074999   \n",
+       "44236                          97.977778                             NaN   \n",
+       "44237                                NaN                       97.485713   \n",
+       "44238                                NaN                       97.264285   \n",
+       "44239                                NaN                       95.400002   \n",
+       "44240                          95.800000                             NaN   \n",
+       "44241                                NaN                       97.670000   \n",
+       "44242                                NaN                       98.980953   \n",
+       "44243                                NaN                             NaN   \n",
+       "44244                                NaN                             NaN   \n",
+       "44245                          98.655000                             NaN   \n",
+       "\n",
+       "       temperature body_degC_223762_MEAN  temperature body_degC_676_MEAN  \\\n",
+       "0                                    NaN                             NaN   \n",
+       "1                                    NaN                             NaN   \n",
+       "2                                    NaN                             NaN   \n",
+       "3                                    NaN                             NaN   \n",
+       "4                                    NaN                             NaN   \n",
+       "5                                    NaN                             NaN   \n",
+       "6                              36.511765                             NaN   \n",
+       "7                                    NaN                             NaN   \n",
+       "8                                    NaN                             NaN   \n",
+       "9                                    NaN                             NaN   \n",
+       "10                                   NaN                             NaN   \n",
+       "11                             36.378571                             NaN   \n",
+       "12                                   NaN                             NaN   \n",
+       "13                                   NaN                       36.766037   \n",
+       "14                                   NaN                             NaN   \n",
+       "15                                   NaN                             NaN   \n",
+       "16                             37.719512                             NaN   \n",
+       "17                                   NaN                       37.193750   \n",
+       "18                                   NaN                             NaN   \n",
+       "19                                   NaN                             NaN   \n",
+       "20                                   NaN                             NaN   \n",
+       "21                                   NaN                             NaN   \n",
+       "22                                   NaN                             NaN   \n",
+       "23                             34.990909                             NaN   \n",
+       "24                                   NaN                       36.799999   \n",
+       "25                                   NaN                             NaN   \n",
+       "26                                   NaN                             NaN   \n",
+       "27                                   NaN                             NaN   \n",
+       "28                                   NaN                       36.847368   \n",
+       "29                                   NaN                             NaN   \n",
+       "...                                  ...                             ...   \n",
+       "44216                                NaN                       37.021739   \n",
+       "44217                                NaN                             NaN   \n",
+       "44218                                NaN                             NaN   \n",
+       "44219                                NaN                             NaN   \n",
+       "44220                                NaN                             NaN   \n",
+       "44221                                NaN                             NaN   \n",
+       "44222                                NaN                             NaN   \n",
+       "44223                                NaN                             NaN   \n",
+       "44224                                NaN                             NaN   \n",
+       "44225                                NaN                             NaN   \n",
+       "44226                                NaN                             NaN   \n",
+       "44227                                NaN                       37.449181   \n",
+       "44228                                NaN                             NaN   \n",
+       "44229                                NaN                             NaN   \n",
+       "44230                                NaN                       37.443518   \n",
+       "44231                                NaN                       36.071429   \n",
+       "44232                                NaN                             NaN   \n",
+       "44233                                NaN                             NaN   \n",
+       "44234                          36.173333                             NaN   \n",
+       "44235                                NaN                             NaN   \n",
+       "44236                                NaN                             NaN   \n",
+       "44237                                NaN                             NaN   \n",
+       "44238                                NaN                             NaN   \n",
+       "44239                                NaN                             NaN   \n",
+       "44240                          34.800000                             NaN   \n",
+       "44241                                NaN                       37.420725   \n",
+       "44242                                NaN                             NaN   \n",
+       "44243                                NaN                       35.750000   \n",
+       "44244                                NaN                       36.176191   \n",
+       "44245                                NaN                             NaN   \n",
+       "\n",
+       "       temperature body_degF_223761_STD  temperature body_degF_678_STD  \\\n",
+       "0                              1.064945                            NaN   \n",
+       "1                              1.167619                            NaN   \n",
+       "2                                   NaN                       0.607729   \n",
+       "3                                   NaN                       1.466263   \n",
+       "4                              0.458258                            NaN   \n",
+       "5                              1.036822                            NaN   \n",
+       "6                              0.641872                            NaN   \n",
+       "7                                   NaN                       0.777816   \n",
+       "8                              0.875032                            NaN   \n",
+       "9                              0.777817                            NaN   \n",
+       "10                                  NaN                       0.492489   \n",
+       "11                                  NaN                            NaN   \n",
+       "12                             1.495650                            NaN   \n",
+       "13                                  NaN                            NaN   \n",
+       "14                                  NaN                            NaN   \n",
+       "15                             0.141421                            NaN   \n",
+       "16                             1.075287                            NaN   \n",
+       "17                                  NaN                            NaN   \n",
+       "18                             0.864975                            NaN   \n",
+       "19                                  NaN                            NaN   \n",
+       "20                             1.022986                            NaN   \n",
+       "21                             0.585662                            NaN   \n",
+       "22                                  NaN                       1.849254   \n",
+       "23                                  NaN                            NaN   \n",
+       "24                                  NaN                            NaN   \n",
+       "25                                  NaN                       0.277491   \n",
+       "26                                  NaN                       0.754119   \n",
+       "27                                  NaN                       1.787487   \n",
+       "28                                  NaN                            NaN   \n",
+       "29                             0.450000                            NaN   \n",
+       "...                                 ...                            ...   \n",
+       "44216                               NaN                       1.047082   \n",
+       "44217                          1.081280                            NaN   \n",
+       "44218                          0.420034                            NaN   \n",
+       "44219                               NaN                            NaN   \n",
+       "44220                               NaN                       1.021275   \n",
+       "44221                               NaN                       0.672309   \n",
+       "44222                          0.512835                            NaN   \n",
+       "44223                          0.070711                            NaN   \n",
+       "44224                               NaN                       0.531351   \n",
+       "44225                               NaN                       0.199997   \n",
+       "44226                          0.765195                            NaN   \n",
+       "44227                               NaN                       0.944674   \n",
+       "44228                               NaN                       1.175605   \n",
+       "44229                          0.740570                            NaN   \n",
+       "44230                               NaN                            NaN   \n",
+       "44231                               NaN                            NaN   \n",
+       "44232                          1.070456                            NaN   \n",
+       "44233                               NaN                       1.300803   \n",
+       "44234                               NaN                            NaN   \n",
+       "44235                               NaN                       1.056330   \n",
+       "44236                          1.032930                            NaN   \n",
+       "44237                               NaN                       0.977118   \n",
+       "44238                               NaN                       0.759157   \n",
+       "44239                               NaN                       0.565688   \n",
+       "44240                               NaN                            NaN   \n",
+       "44241                               NaN                       0.668415   \n",
+       "44242                               NaN                       0.933605   \n",
+       "44243                               NaN                            NaN   \n",
+       "44244                               NaN                            NaN   \n",
+       "44245                          1.147297                            NaN   \n",
+       "\n",
+       "       temperature body_degC_223762_STD  temperature body_degC_676_STD  \\\n",
+       "0                                   NaN                            NaN   \n",
+       "1                                   NaN                            NaN   \n",
+       "2                                   NaN                            NaN   \n",
+       "3                                   NaN                            NaN   \n",
+       "4                                   NaN                            NaN   \n",
+       "5                                   NaN                            NaN   \n",
+       "6                              0.790767                            NaN   \n",
+       "7                                   NaN                            NaN   \n",
+       "8                                   NaN                            NaN   \n",
+       "9                                   NaN                            NaN   \n",
+       "10                                  NaN                            NaN   \n",
+       "11                             0.260705                            NaN   \n",
+       "12                                  NaN                            NaN   \n",
+       "13                                  NaN                       0.374646   \n",
+       "14                                  NaN                            NaN   \n",
+       "15                                  NaN                            NaN   \n",
+       "16                             0.281265                            NaN   \n",
+       "17                                  NaN                       0.401560   \n",
+       "18                                  NaN                            NaN   \n",
+       "19                                  NaN                            NaN   \n",
+       "20                                  NaN                            NaN   \n",
+       "21                                  NaN                            NaN   \n",
+       "22                                  NaN                            NaN   \n",
+       "23                             4.190574                            NaN   \n",
+       "24                                  NaN                            NaN   \n",
+       "25                                  NaN                            NaN   \n",
+       "26                                  NaN                            NaN   \n",
+       "27                                  NaN                            NaN   \n",
+       "28                                  NaN                       0.300681   \n",
+       "29                                  NaN                            NaN   \n",
+       "...                                 ...                            ...   \n",
+       "44216                               NaN                       0.997311   \n",
+       "44217                               NaN                            NaN   \n",
+       "44218                               NaN                            NaN   \n",
+       "44219                               NaN                            NaN   \n",
+       "44220                               NaN                            NaN   \n",
+       "44221                               NaN                            NaN   \n",
+       "44222                               NaN                            NaN   \n",
+       "44223                               NaN                            NaN   \n",
+       "44224                               NaN                            NaN   \n",
+       "44225                               NaN                            NaN   \n",
+       "44226                               NaN                            NaN   \n",
+       "44227                               NaN                       0.920982   \n",
+       "44228                               NaN                            NaN   \n",
+       "44229                               NaN                            NaN   \n",
+       "44230                               NaN                       0.332443   \n",
+       "44231                               NaN                       0.239964   \n",
+       "44232                               NaN                            NaN   \n",
+       "44233                               NaN                            NaN   \n",
+       "44234                          0.688131                            NaN   \n",
+       "44235                               NaN                            NaN   \n",
+       "44236                               NaN                            NaN   \n",
+       "44237                               NaN                            NaN   \n",
+       "44238                               NaN                            NaN   \n",
+       "44239                               NaN                            NaN   \n",
+       "44240                               NaN                            NaN   \n",
+       "44241                               NaN                       0.378023   \n",
+       "44242                               NaN                            NaN   \n",
+       "44243                               NaN                       0.919241   \n",
+       "44244                               NaN                       1.159700   \n",
+       "44245                               NaN                            NaN   \n",
+       "\n",
+       "       temperature body_degF_223761_COUNT  temperature body_degF_678_COUNT  \\\n",
+       "0                                     8.0                              0.0   \n",
+       "1                                     3.0                              0.0   \n",
+       "2                                     0.0                             21.0   \n",
+       "3                                     0.0                             12.0   \n",
+       "4                                     3.0                              0.0   \n",
+       "5                                     6.0                              0.0   \n",
+       "6                                     5.0                              0.0   \n",
+       "7                                     0.0                              2.0   \n",
+       "8                                    12.0                              0.0   \n",
+       "9                                     2.0                              0.0   \n",
+       "10                                    0.0                             11.0   \n",
+       "11                                    0.0                              0.0   \n",
+       "12                                   12.0                              0.0   \n",
+       "13                                    0.0                              1.0   \n",
+       "14                                    0.0                              1.0   \n",
+       "15                                    2.0                              0.0   \n",
+       "16                                   18.0                              0.0   \n",
+       "17                                    0.0                              0.0   \n",
+       "18                                   33.0                              0.0   \n",
+       "19                                    0.0                              1.0   \n",
+       "20                                   16.0                              0.0   \n",
+       "21                                    5.0                              0.0   \n",
+       "22                                    0.0                             22.0   \n",
+       "23                                    0.0                              0.0   \n",
+       "24                                    0.0                              0.0   \n",
+       "25                                    0.0                              5.0   \n",
+       "26                                    0.0                             24.0   \n",
+       "27                                    0.0                             10.0   \n",
+       "28                                    0.0                              0.0   \n",
+       "29                                    4.0                              0.0   \n",
+       "...                                   ...                              ...   \n",
+       "44216                                 0.0                             37.0   \n",
+       "44217                                 4.0                              0.0   \n",
+       "44218                                 8.0                              0.0   \n",
+       "44219                                 0.0                              1.0   \n",
+       "44220                                 0.0                              5.0   \n",
+       "44221                                 0.0                              5.0   \n",
+       "44222                                 5.0                              0.0   \n",
+       "44223                                 2.0                              0.0   \n",
+       "44224                                 0.0                             10.0   \n",
+       "44225                                 0.0                              4.0   \n",
+       "44226                                15.0                              0.0   \n",
+       "44227                                 0.0                             32.0   \n",
+       "44228                                 0.0                             19.0   \n",
+       "44229                                10.0                              0.0   \n",
+       "44230                                 0.0                              0.0   \n",
+       "44231                                 0.0                              0.0   \n",
+       "44232                                32.0                              0.0   \n",
+       "44233                                 0.0                            130.0   \n",
+       "44234                                 0.0                              0.0   \n",
+       "44235                                 0.0                              4.0   \n",
+       "44236                                 9.0                              0.0   \n",
+       "44237                                 0.0                              7.0   \n",
+       "44238                                 0.0                             14.0   \n",
+       "44239                                 0.0                              2.0   \n",
+       "44240                                 1.0                              0.0   \n",
+       "44241                                 0.0                             10.0   \n",
+       "44242                                 0.0                             21.0   \n",
+       "44243                                 0.0                              0.0   \n",
+       "44244                                 0.0                              0.0   \n",
+       "44245                                20.0                              0.0   \n",
+       "\n",
+       "       temperature body_degC_223762_COUNT  temperature body_degC_676_COUNT  \\\n",
+       "0                                     0.0                              0.0   \n",
+       "1                                     0.0                              0.0   \n",
+       "2                                     0.0                              0.0   \n",
+       "3                                     0.0                              0.0   \n",
+       "4                                     0.0                              0.0   \n",
+       "5                                     0.0                              0.0   \n",
+       "6                                    34.0                              0.0   \n",
+       "7                                     0.0                              0.0   \n",
+       "8                                     0.0                              0.0   \n",
+       "9                                     0.0                              0.0   \n",
+       "10                                    0.0                              0.0   \n",
+       "11                                   14.0                              0.0   \n",
+       "12                                    0.0                              0.0   \n",
+       "13                                    0.0                            106.0   \n",
+       "14                                    0.0                              0.0   \n",
+       "15                                    0.0                              0.0   \n",
+       "16                                   41.0                              0.0   \n",
+       "17                                    0.0                             32.0   \n",
+       "18                                    0.0                              0.0   \n",
+       "19                                    0.0                              0.0   \n",
+       "20                                    0.0                              0.0   \n",
+       "21                                    0.0                              0.0   \n",
+       "22                                    0.0                              0.0   \n",
+       "23                                   11.0                              0.0   \n",
+       "24                                    0.0                              1.0   \n",
+       "25                                    0.0                              0.0   \n",
+       "26                                    0.0                              0.0   \n",
+       "27                                    0.0                              0.0   \n",
+       "28                                    0.0                             19.0   \n",
+       "29                                    0.0                              0.0   \n",
+       "...                                   ...                              ...   \n",
+       "44216                                 0.0                             46.0   \n",
+       "44217                                 0.0                              0.0   \n",
+       "44218                                 0.0                              0.0   \n",
+       "44219                                 0.0                              0.0   \n",
+       "44220                                 0.0                              0.0   \n",
+       "44221                                 0.0                              0.0   \n",
+       "44222                                 0.0                              0.0   \n",
+       "44223                                 0.0                              0.0   \n",
+       "44224                                 0.0                              0.0   \n",
+       "44225                                 0.0                              0.0   \n",
+       "44226                                 0.0                              0.0   \n",
+       "44227                                 0.0                             61.0   \n",
+       "44228                                 0.0                              0.0   \n",
+       "44229                                 0.0                              0.0   \n",
+       "44230                                 0.0                            108.0   \n",
+       "44231                                 0.0                             14.0   \n",
+       "44232                                 0.0                              0.0   \n",
+       "44233                                 0.0                              0.0   \n",
+       "44234                                15.0                              0.0   \n",
+       "44235                                 0.0                              0.0   \n",
+       "44236                                 0.0                              0.0   \n",
+       "44237                                 0.0                              0.0   \n",
+       "44238                                 0.0                              0.0   \n",
+       "44239                                 0.0                              0.0   \n",
+       "44240                                 1.0                              0.0   \n",
+       "44241                                 0.0                            193.0   \n",
+       "44242                                 0.0                              0.0   \n",
+       "44243                                 0.0                              2.0   \n",
+       "44244                                 0.0                             21.0   \n",
+       "44245                                 0.0                              0.0   \n",
+       "\n",
+       "       temperature body_degF_223761_LAST  temperature body_degF_678_LAST  \\\n",
+       "0                                   98.0                             NaN   \n",
+       "1                                   95.9                             NaN   \n",
+       "2                                    NaN                       97.000000   \n",
+       "3                                    NaN                       95.699997   \n",
+       "4                                   98.6                             NaN   \n",
+       "5                                  100.2                             NaN   \n",
+       "6                                    NaN                             NaN   \n",
+       "7                                    NaN                      101.199997   \n",
+       "8                                   97.4                             NaN   \n",
+       "9                                   96.6                             NaN   \n",
+       "10                                   NaN                       98.500000   \n",
+       "11                                   NaN                             NaN   \n",
+       "12                                  98.8                             NaN   \n",
+       "13                                   NaN                             NaN   \n",
+       "14                                   NaN                       95.300003   \n",
+       "15                                  98.6                             NaN   \n",
+       "16                                   NaN                             NaN   \n",
+       "17                                   NaN                             NaN   \n",
+       "18                                  98.6                             NaN   \n",
+       "19                                   NaN                       98.800003   \n",
+       "20                                  97.6                             NaN   \n",
+       "21                                  97.8                             NaN   \n",
+       "22                                   NaN                       97.800003   \n",
+       "23                                   NaN                             NaN   \n",
+       "24                                   NaN                             NaN   \n",
+       "25                                   NaN                       97.199997   \n",
+       "26                                   NaN                       97.000000   \n",
+       "27                                   NaN                       94.000000   \n",
+       "28                                   NaN                             NaN   \n",
+       "29                                  96.9                             NaN   \n",
+       "...                                  ...                             ...   \n",
+       "44216                                NaN                       96.000000   \n",
+       "44217                               97.1                             NaN   \n",
+       "44218                               96.3                             NaN   \n",
+       "44219                                NaN                       97.800003   \n",
+       "44220                                NaN                       94.099998   \n",
+       "44221                                NaN                       97.099998   \n",
+       "44222                               99.8                             NaN   \n",
+       "44223                               98.4                             NaN   \n",
+       "44224                                NaN                       97.800003   \n",
+       "44225                                NaN                       97.800003   \n",
+       "44226                               98.7                             NaN   \n",
+       "44227                                NaN                             NaN   \n",
+       "44228                                NaN                       98.000000   \n",
+       "44229                               96.9                             NaN   \n",
+       "44230                                NaN                             NaN   \n",
+       "44231                                NaN                             NaN   \n",
+       "44232                              100.0                             NaN   \n",
+       "44233                                NaN                       97.900002   \n",
+       "44234                                NaN                             NaN   \n",
+       "44235                                NaN                       95.599998   \n",
+       "44236                               98.4                             NaN   \n",
+       "44237                                NaN                       95.900002   \n",
+       "44238                                NaN                       96.599998   \n",
+       "44239                                NaN                       95.000000   \n",
+       "44240                                NaN                             NaN   \n",
+       "44241                                NaN                       98.699997   \n",
+       "44242                                NaN                       99.400002   \n",
+       "44243                                NaN                             NaN   \n",
+       "44244                                NaN                             NaN   \n",
+       "44245                               97.8                             NaN   \n",
+       "\n",
+       "       temperature body_degC_223762_LAST  temperature body_degC_676_LAST  \n",
+       "0                                    NaN                             NaN  \n",
+       "1                                    NaN                             NaN  \n",
+       "2                                    NaN                             NaN  \n",
+       "3                                    NaN                             NaN  \n",
+       "4                                    NaN                             NaN  \n",
+       "5                                    NaN                             NaN  \n",
+       "6                                   34.5                             NaN  \n",
+       "7                                    NaN                             NaN  \n",
+       "8                                    NaN                             NaN  \n",
+       "9                                    NaN                             NaN  \n",
+       "10                                   NaN                             NaN  \n",
+       "11                                  36.6                             NaN  \n",
+       "12                                   NaN                             NaN  \n",
+       "13                                   NaN                       36.599998  \n",
+       "14                                   NaN                             NaN  \n",
+       "15                                   NaN                             NaN  \n",
+       "16                                  37.5                             NaN  \n",
+       "17                                   NaN                       36.799999  \n",
+       "18                                   NaN                             NaN  \n",
+       "19                                   NaN                             NaN  \n",
+       "20                                   NaN                             NaN  \n",
+       "21                                   NaN                             NaN  \n",
+       "22                                   NaN                             NaN  \n",
+       "23                                  28.4                             NaN  \n",
+       "24                                   NaN                       36.799999  \n",
+       "25                                   NaN                             NaN  \n",
+       "26                                   NaN                             NaN  \n",
+       "27                                   NaN                             NaN  \n",
+       "28                                   NaN                       36.200001  \n",
+       "29                                   NaN                             NaN  \n",
+       "...                                  ...                             ...  \n",
+       "44216                                NaN                             NaN  \n",
+       "44217                                NaN                             NaN  \n",
+       "44218                                NaN                             NaN  \n",
+       "44219                                NaN                             NaN  \n",
+       "44220                                NaN                             NaN  \n",
+       "44221                                NaN                             NaN  \n",
+       "44222                                NaN                             NaN  \n",
+       "44223                                NaN                             NaN  \n",
+       "44224                                NaN                             NaN  \n",
+       "44225                                NaN                             NaN  \n",
+       "44226                                NaN                             NaN  \n",
+       "44227                                NaN                       34.500000  \n",
+       "44228                                NaN                             NaN  \n",
+       "44229                                NaN                             NaN  \n",
+       "44230                                NaN                       37.299999  \n",
+       "44231                                NaN                       35.599998  \n",
+       "44232                                NaN                             NaN  \n",
+       "44233                                NaN                             NaN  \n",
+       "44234                               35.0                             NaN  \n",
+       "44235                                NaN                             NaN  \n",
+       "44236                                NaN                             NaN  \n",
+       "44237                                NaN                             NaN  \n",
+       "44238                                NaN                             NaN  \n",
+       "44239                                NaN                             NaN  \n",
+       "44240                               34.8                             NaN  \n",
+       "44241                                NaN                             NaN  \n",
+       "44242                                NaN                             NaN  \n",
+       "44243                                NaN                       35.099998  \n",
+       "44244                                NaN                       34.700001  \n",
+       "44245                                NaN                             NaN  \n",
+       "\n",
+       "[44246 rows x 16 columns]"
+      ]
+     },
+     "execution_count": 233,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "feature_df"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 120,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# Single-step pipeline that registers `mapped_ft` under the step name 'ft_mapper'.\n",
+    "test_mapper_pipeline = Pipeline(steps=[('ft_mapper', mapped_ft)])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 121,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>temperature body_known_qn_degF_223761_MEAN</th>\n",
+       "      <th>temperature body_known_qn_degF_678_MEAN</th>\n",
+       "      <th>temperature body_known_qn_degF_223762(degC)_MEAN</th>\n",
+       "      <th>temperature body_known_qn_degF_676(degC)_MEAN</th>\n",
+       "      <th>temperature body_known_qn_degF_223761_STD</th>\n",
+       "      <th>temperature body_known_qn_degF_678_STD</th>\n",
+       "      <th>temperature body_known_qn_degF_223762(degC)_STD</th>\n",
+       "      <th>temperature body_known_qn_degF_676(degC)_STD</th>\n",
+       "      <th>temperature body_known_qn_degF_223761_COUNT</th>\n",
+       "      <th>temperature body_known_qn_degF_678_COUNT</th>\n",
+       "      <th>temperature body_known_qn_degF_223762(degC)_COUNT</th>\n",
+       "      <th>temperature body_known_qn_degF_676(degC)_COUNT</th>\n",
+       "      <th>temperature body_known_qn_degF_223761_LAST</th>\n",
+       "      <th>temperature body_known_qn_degF_678_LAST</th>\n",
+       "      <th>temperature body_known_qn_degF_223762(degC)_LAST</th>\n",
+       "      <th>temperature body_known_qn_degF_676(degC)_LAST</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>98.537500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.537500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.537500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.537500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>97.166667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.166667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.166667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.166667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.533334</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.533334</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.533334</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.533334</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.591667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.591667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.591667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.591667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>98.100000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.100000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.100000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.100000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>98.550000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.550000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.550000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.550000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>98.380000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.721177</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.380000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.721177</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.380000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.721177</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.380000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.721177</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.649998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.649998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.649998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.649998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>97.975000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.975000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.975000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.975000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>96.050000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.050000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.050000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.050000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.536364</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.536364</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.536364</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.536364</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.481429</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.481429</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.481429</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.481429</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12</th>\n",
+       "      <td>99.466667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.466667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.466667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.466667</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>13</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.178868</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.178868</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.178868</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.099998</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.178868</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>14</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.300003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>15</th>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.500000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>16</th>\n",
+       "      <td>100.772222</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.895122</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.772222</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.895122</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.772222</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.895122</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.772222</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.895122</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>17</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.948750</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.948750</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.948750</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.948750</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>18</th>\n",
+       "      <td>99.345455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.345455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.345455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.345455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>19</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>20</th>\n",
+       "      <td>98.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.312500</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>21</th>\n",
+       "      <td>97.760000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.760000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.760000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.760000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>22</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.445455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.445455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.445455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.445455</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>23</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.983637</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.983637</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.983637</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.983637</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>24</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.239999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.239999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.239999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.239999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.320000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.320000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.320000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.320000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>26</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.700000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.700000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.700000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.700000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>27</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>28</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.325263</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.325263</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.325263</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.325263</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>29</th>\n",
+       "      <td>96.525000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.525000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.525000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.525000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44216</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.302703</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.639131</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.302703</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.639131</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.302703</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.639131</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.302703</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.639131</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44217</th>\n",
+       "      <td>98.475000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.475000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.475000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.475000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44218</th>\n",
+       "      <td>96.275000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.275000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.275000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.275000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44219</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.800003</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44220</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.740001</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.740001</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.740001</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.740001</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44221</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.920000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44222</th>\n",
+       "      <td>99.240000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.240000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.240000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.240000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44223</th>\n",
+       "      <td>98.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.450000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44224</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.130000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.130000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.130000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.130000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44225</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.900002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44226</th>\n",
+       "      <td>99.753333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.753333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.753333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.753333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44227</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.071875</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.408525</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.071875</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.408525</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.071875</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.408525</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.071875</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.408525</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44228</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.526316</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.526316</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.526316</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.526316</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44229</th>\n",
+       "      <td>97.580000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.580000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.580000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.580000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44230</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.398333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.398333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.398333</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.398333</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44231</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.928572</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.928572</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.928572</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.928572</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44232</th>\n",
+       "      <td>98.484375</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.484375</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.484375</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.484375</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44233</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.278462</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.278462</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.278462</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>100.278462</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44234</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.112000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.112000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.112000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.112000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44235</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.074999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.074999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.074999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.074999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44236</th>\n",
+       "      <td>97.977778</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.977778</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.977778</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.977778</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44237</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.485713</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.485713</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.485713</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.485713</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44238</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.264285</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.264285</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.264285</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.264285</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44239</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.400002</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44240</th>\n",
+       "      <td>95.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.640000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.640000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.640000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>95.800000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>94.640000</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44241</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.670000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.357306</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.670000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.357306</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.670000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.357306</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.670000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>99.357306</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44242</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.980953</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.980953</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.980953</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.980953</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44243</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.350000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.350000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.350000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>96.350000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44244</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.117143</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.117143</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.117143</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>97.117143</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>44245</th>\n",
+       "      <td>98.655000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.655000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.655000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>98.655000</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>44246 rows × 16 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       temperature body_known_qn_degF_223761_MEAN  \\\n",
+       "0                                       98.537500   \n",
+       "1                                       97.166667   \n",
+       "2                                             NaN   \n",
+       "3                                             NaN   \n",
+       "4                                       98.100000   \n",
+       "5                                       98.550000   \n",
+       "6                                       98.380000   \n",
+       "7                                             NaN   \n",
+       "8                                       97.975000   \n",
+       "9                                       96.050000   \n",
+       "10                                            NaN   \n",
+       "11                                            NaN   \n",
+       "12                                      99.466667   \n",
+       "13                                            NaN   \n",
+       "14                                            NaN   \n",
+       "15                                      98.500000   \n",
+       "16                                     100.772222   \n",
+       "17                                            NaN   \n",
+       "18                                      99.345455   \n",
+       "19                                            NaN   \n",
+       "20                                      98.312500   \n",
+       "21                                      97.760000   \n",
+       "22                                            NaN   \n",
+       "23                                            NaN   \n",
+       "24                                            NaN   \n",
+       "25                                            NaN   \n",
+       "26                                            NaN   \n",
+       "27                                            NaN   \n",
+       "28                                            NaN   \n",
+       "29                                      96.525000   \n",
+       "...                                           ...   \n",
+       "44216                                         NaN   \n",
+       "44217                                   98.475000   \n",
+       "44218                                   96.275000   \n",
+       "44219                                         NaN   \n",
+       "44220                                         NaN   \n",
+       "44221                                         NaN   \n",
+       "44222                                   99.240000   \n",
+       "44223                                   98.450000   \n",
+       "44224                                         NaN   \n",
+       "44225                                         NaN   \n",
+       "44226                                   99.753333   \n",
+       "44227                                         NaN   \n",
+       "44228                                         NaN   \n",
+       "44229                                   97.580000   \n",
+       "44230                                         NaN   \n",
+       "44231                                         NaN   \n",
+       "44232                                   98.484375   \n",
+       "44233                                         NaN   \n",
+       "44234                                         NaN   \n",
+       "44235                                         NaN   \n",
+       "44236                                   97.977778   \n",
+       "44237                                         NaN   \n",
+       "44238                                         NaN   \n",
+       "44239                                         NaN   \n",
+       "44240                                   95.800000   \n",
+       "44241                                         NaN   \n",
+       "44242                                         NaN   \n",
+       "44243                                         NaN   \n",
+       "44244                                         NaN   \n",
+       "44245                                   98.655000   \n",
+       "\n",
+       "       temperature body_known_qn_degF_678_MEAN  \\\n",
+       "0                                          NaN   \n",
+       "1                                          NaN   \n",
+       "2                                    97.533334   \n",
+       "3                                    98.591667   \n",
+       "4                                          NaN   \n",
+       "5                                          NaN   \n",
+       "6                                          NaN   \n",
+       "7                                   100.649998   \n",
+       "8                                          NaN   \n",
+       "9                                          NaN   \n",
+       "10                                   98.536364   \n",
+       "11                                         NaN   \n",
+       "12                                         NaN   \n",
+       "13                                   99.099998   \n",
+       "14                                   95.300003   \n",
+       "15                                         NaN   \n",
+       "16                                         NaN   \n",
+       "17                                         NaN   \n",
+       "18                                         NaN   \n",
+       "19                                   98.800003   \n",
+       "20                                         NaN   \n",
+       "21                                         NaN   \n",
+       "22                                   98.445455   \n",
+       "23                                         NaN   \n",
+       "24                                         NaN   \n",
+       "25                                   97.320000   \n",
+       "26                                   96.700000   \n",
+       "27                                   96.920000   \n",
+       "28                                         NaN   \n",
+       "29                                         NaN   \n",
+       "...                                        ...   \n",
+       "44216                                98.302703   \n",
+       "44217                                      NaN   \n",
+       "44218                                      NaN   \n",
+       "44219                                97.800003   \n",
+       "44220                                95.740001   \n",
+       "44221                                97.920000   \n",
+       "44222                                      NaN   \n",
+       "44223                                      NaN   \n",
+       "44224                                98.130000   \n",
+       "44225                                97.900002   \n",
+       "44226                                      NaN   \n",
+       "44227                                98.071875   \n",
+       "44228                               100.526316   \n",
+       "44229                                      NaN   \n",
+       "44230                                      NaN   \n",
+       "44231                                      NaN   \n",
+       "44232                                      NaN   \n",
+       "44233                               100.278462   \n",
+       "44234                                      NaN   \n",
+       "44235                                97.074999   \n",
+       "44236                                      NaN   \n",
+       "44237                                97.485713   \n",
+       "44238                                97.264285   \n",
+       "44239                                95.400002   \n",
+       "44240                                      NaN   \n",
+       "44241                                97.670000   \n",
+       "44242                                98.980953   \n",
+       "44243                                      NaN   \n",
+       "44244                                      NaN   \n",
+       "44245                                      NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223762(degC)_MEAN  \\\n",
+       "0                                                   NaN   \n",
+       "1                                                   NaN   \n",
+       "2                                                   NaN   \n",
+       "3                                                   NaN   \n",
+       "4                                                   NaN   \n",
+       "5                                                   NaN   \n",
+       "6                                             97.721177   \n",
+       "7                                                   NaN   \n",
+       "8                                                   NaN   \n",
+       "9                                                   NaN   \n",
+       "10                                                  NaN   \n",
+       "11                                            97.481429   \n",
+       "12                                                  NaN   \n",
+       "13                                                  NaN   \n",
+       "14                                                  NaN   \n",
+       "15                                                  NaN   \n",
+       "16                                            99.895122   \n",
+       "17                                                  NaN   \n",
+       "18                                                  NaN   \n",
+       "19                                                  NaN   \n",
+       "20                                                  NaN   \n",
+       "21                                                  NaN   \n",
+       "22                                                  NaN   \n",
+       "23                                            94.983637   \n",
+       "24                                                  NaN   \n",
+       "25                                                  NaN   \n",
+       "26                                                  NaN   \n",
+       "27                                                  NaN   \n",
+       "28                                                  NaN   \n",
+       "29                                                  NaN   \n",
+       "...                                                 ...   \n",
+       "44216                                               NaN   \n",
+       "44217                                               NaN   \n",
+       "44218                                               NaN   \n",
+       "44219                                               NaN   \n",
+       "44220                                               NaN   \n",
+       "44221                                               NaN   \n",
+       "44222                                               NaN   \n",
+       "44223                                               NaN   \n",
+       "44224                                               NaN   \n",
+       "44225                                               NaN   \n",
+       "44226                                               NaN   \n",
+       "44227                                               NaN   \n",
+       "44228                                               NaN   \n",
+       "44229                                               NaN   \n",
+       "44230                                               NaN   \n",
+       "44231                                               NaN   \n",
+       "44232                                               NaN   \n",
+       "44233                                               NaN   \n",
+       "44234                                         97.112000   \n",
+       "44235                                               NaN   \n",
+       "44236                                               NaN   \n",
+       "44237                                               NaN   \n",
+       "44238                                               NaN   \n",
+       "44239                                               NaN   \n",
+       "44240                                         94.640000   \n",
+       "44241                                               NaN   \n",
+       "44242                                               NaN   \n",
+       "44243                                               NaN   \n",
+       "44244                                               NaN   \n",
+       "44245                                               NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_676(degC)_MEAN  \\\n",
+       "0                                                NaN   \n",
+       "1                                                NaN   \n",
+       "2                                                NaN   \n",
+       "3                                                NaN   \n",
+       "4                                                NaN   \n",
+       "5                                                NaN   \n",
+       "6                                                NaN   \n",
+       "7                                                NaN   \n",
+       "8                                                NaN   \n",
+       "9                                                NaN   \n",
+       "10                                               NaN   \n",
+       "11                                               NaN   \n",
+       "12                                               NaN   \n",
+       "13                                         98.178868   \n",
+       "14                                               NaN   \n",
+       "15                                               NaN   \n",
+       "16                                               NaN   \n",
+       "17                                         98.948750   \n",
+       "18                                               NaN   \n",
+       "19                                               NaN   \n",
+       "20                                               NaN   \n",
+       "21                                               NaN   \n",
+       "22                                               NaN   \n",
+       "23                                               NaN   \n",
+       "24                                         98.239999   \n",
+       "25                                               NaN   \n",
+       "26                                               NaN   \n",
+       "27                                               NaN   \n",
+       "28                                         98.325263   \n",
+       "29                                               NaN   \n",
+       "...                                              ...   \n",
+       "44216                                      98.639131   \n",
+       "44217                                            NaN   \n",
+       "44218                                            NaN   \n",
+       "44219                                            NaN   \n",
+       "44220                                            NaN   \n",
+       "44221                                            NaN   \n",
+       "44222                                            NaN   \n",
+       "44223                                            NaN   \n",
+       "44224                                            NaN   \n",
+       "44225                                            NaN   \n",
+       "44226                                            NaN   \n",
+       "44227                                      99.408525   \n",
+       "44228                                            NaN   \n",
+       "44229                                            NaN   \n",
+       "44230                                      99.398333   \n",
+       "44231                                      96.928572   \n",
+       "44232                                            NaN   \n",
+       "44233                                            NaN   \n",
+       "44234                                            NaN   \n",
+       "44235                                            NaN   \n",
+       "44236                                            NaN   \n",
+       "44237                                            NaN   \n",
+       "44238                                            NaN   \n",
+       "44239                                            NaN   \n",
+       "44240                                            NaN   \n",
+       "44241                                      99.357306   \n",
+       "44242                                            NaN   \n",
+       "44243                                      96.350000   \n",
+       "44244                                      97.117143   \n",
+       "44245                                            NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223761_STD  \\\n",
+       "0                                      98.537500   \n",
+       "1                                      97.166667   \n",
+       "2                                            NaN   \n",
+       "3                                            NaN   \n",
+       "4                                      98.100000   \n",
+       "5                                      98.550000   \n",
+       "6                                      98.380000   \n",
+       "7                                            NaN   \n",
+       "8                                      97.975000   \n",
+       "9                                      96.050000   \n",
+       "10                                           NaN   \n",
+       "11                                           NaN   \n",
+       "12                                     99.466667   \n",
+       "13                                           NaN   \n",
+       "14                                           NaN   \n",
+       "15                                     98.500000   \n",
+       "16                                    100.772222   \n",
+       "17                                           NaN   \n",
+       "18                                     99.345455   \n",
+       "19                                           NaN   \n",
+       "20                                     98.312500   \n",
+       "21                                     97.760000   \n",
+       "22                                           NaN   \n",
+       "23                                           NaN   \n",
+       "24                                           NaN   \n",
+       "25                                           NaN   \n",
+       "26                                           NaN   \n",
+       "27                                           NaN   \n",
+       "28                                           NaN   \n",
+       "29                                     96.525000   \n",
+       "...                                          ...   \n",
+       "44216                                        NaN   \n",
+       "44217                                  98.475000   \n",
+       "44218                                  96.275000   \n",
+       "44219                                        NaN   \n",
+       "44220                                        NaN   \n",
+       "44221                                        NaN   \n",
+       "44222                                  99.240000   \n",
+       "44223                                  98.450000   \n",
+       "44224                                        NaN   \n",
+       "44225                                        NaN   \n",
+       "44226                                  99.753333   \n",
+       "44227                                        NaN   \n",
+       "44228                                        NaN   \n",
+       "44229                                  97.580000   \n",
+       "44230                                        NaN   \n",
+       "44231                                        NaN   \n",
+       "44232                                  98.484375   \n",
+       "44233                                        NaN   \n",
+       "44234                                        NaN   \n",
+       "44235                                        NaN   \n",
+       "44236                                  97.977778   \n",
+       "44237                                        NaN   \n",
+       "44238                                        NaN   \n",
+       "44239                                        NaN   \n",
+       "44240                                  95.800000   \n",
+       "44241                                        NaN   \n",
+       "44242                                        NaN   \n",
+       "44243                                        NaN   \n",
+       "44244                                        NaN   \n",
+       "44245                                  98.655000   \n",
+       "\n",
+       "       temperature body_known_qn_degF_678_STD  \\\n",
+       "0                                         NaN   \n",
+       "1                                         NaN   \n",
+       "2                                   97.533334   \n",
+       "3                                   98.591667   \n",
+       "4                                         NaN   \n",
+       "5                                         NaN   \n",
+       "6                                         NaN   \n",
+       "7                                  100.649998   \n",
+       "8                                         NaN   \n",
+       "9                                         NaN   \n",
+       "10                                  98.536364   \n",
+       "11                                        NaN   \n",
+       "12                                        NaN   \n",
+       "13                                  99.099998   \n",
+       "14                                  95.300003   \n",
+       "15                                        NaN   \n",
+       "16                                        NaN   \n",
+       "17                                        NaN   \n",
+       "18                                        NaN   \n",
+       "19                                  98.800003   \n",
+       "20                                        NaN   \n",
+       "21                                        NaN   \n",
+       "22                                  98.445455   \n",
+       "23                                        NaN   \n",
+       "24                                        NaN   \n",
+       "25                                  97.320000   \n",
+       "26                                  96.700000   \n",
+       "27                                  96.920000   \n",
+       "28                                        NaN   \n",
+       "29                                        NaN   \n",
+       "...                                       ...   \n",
+       "44216                               98.302703   \n",
+       "44217                                     NaN   \n",
+       "44218                                     NaN   \n",
+       "44219                               97.800003   \n",
+       "44220                               95.740001   \n",
+       "44221                               97.920000   \n",
+       "44222                                     NaN   \n",
+       "44223                                     NaN   \n",
+       "44224                               98.130000   \n",
+       "44225                               97.900002   \n",
+       "44226                                     NaN   \n",
+       "44227                               98.071875   \n",
+       "44228                              100.526316   \n",
+       "44229                                     NaN   \n",
+       "44230                                     NaN   \n",
+       "44231                                     NaN   \n",
+       "44232                                     NaN   \n",
+       "44233                              100.278462   \n",
+       "44234                                     NaN   \n",
+       "44235                               97.074999   \n",
+       "44236                                     NaN   \n",
+       "44237                               97.485713   \n",
+       "44238                               97.264285   \n",
+       "44239                               95.400002   \n",
+       "44240                                     NaN   \n",
+       "44241                               97.670000   \n",
+       "44242                               98.980953   \n",
+       "44243                                     NaN   \n",
+       "44244                                     NaN   \n",
+       "44245                                     NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223762(degC)_STD  \\\n",
+       "0                                                  NaN   \n",
+       "1                                                  NaN   \n",
+       "2                                                  NaN   \n",
+       "3                                                  NaN   \n",
+       "4                                                  NaN   \n",
+       "5                                                  NaN   \n",
+       "6                                            97.721177   \n",
+       "7                                                  NaN   \n",
+       "8                                                  NaN   \n",
+       "9                                                  NaN   \n",
+       "10                                                 NaN   \n",
+       "11                                           97.481429   \n",
+       "12                                                 NaN   \n",
+       "13                                                 NaN   \n",
+       "14                                                 NaN   \n",
+       "15                                                 NaN   \n",
+       "16                                           99.895122   \n",
+       "17                                                 NaN   \n",
+       "18                                                 NaN   \n",
+       "19                                                 NaN   \n",
+       "20                                                 NaN   \n",
+       "21                                                 NaN   \n",
+       "22                                                 NaN   \n",
+       "23                                           94.983637   \n",
+       "24                                                 NaN   \n",
+       "25                                                 NaN   \n",
+       "26                                                 NaN   \n",
+       "27                                                 NaN   \n",
+       "28                                                 NaN   \n",
+       "29                                                 NaN   \n",
+       "...                                                ...   \n",
+       "44216                                              NaN   \n",
+       "44217                                              NaN   \n",
+       "44218                                              NaN   \n",
+       "44219                                              NaN   \n",
+       "44220                                              NaN   \n",
+       "44221                                              NaN   \n",
+       "44222                                              NaN   \n",
+       "44223                                              NaN   \n",
+       "44224                                              NaN   \n",
+       "44225                                              NaN   \n",
+       "44226                                              NaN   \n",
+       "44227                                              NaN   \n",
+       "44228                                              NaN   \n",
+       "44229                                              NaN   \n",
+       "44230                                              NaN   \n",
+       "44231                                              NaN   \n",
+       "44232                                              NaN   \n",
+       "44233                                              NaN   \n",
+       "44234                                        97.112000   \n",
+       "44235                                              NaN   \n",
+       "44236                                              NaN   \n",
+       "44237                                              NaN   \n",
+       "44238                                              NaN   \n",
+       "44239                                              NaN   \n",
+       "44240                                        94.640000   \n",
+       "44241                                              NaN   \n",
+       "44242                                              NaN   \n",
+       "44243                                              NaN   \n",
+       "44244                                              NaN   \n",
+       "44245                                              NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_676(degC)_STD  \\\n",
+       "0                                               NaN   \n",
+       "1                                               NaN   \n",
+       "2                                               NaN   \n",
+       "3                                               NaN   \n",
+       "4                                               NaN   \n",
+       "5                                               NaN   \n",
+       "6                                               NaN   \n",
+       "7                                               NaN   \n",
+       "8                                               NaN   \n",
+       "9                                               NaN   \n",
+       "10                                              NaN   \n",
+       "11                                              NaN   \n",
+       "12                                              NaN   \n",
+       "13                                        98.178868   \n",
+       "14                                              NaN   \n",
+       "15                                              NaN   \n",
+       "16                                              NaN   \n",
+       "17                                        98.948750   \n",
+       "18                                              NaN   \n",
+       "19                                              NaN   \n",
+       "20                                              NaN   \n",
+       "21                                              NaN   \n",
+       "22                                              NaN   \n",
+       "23                                              NaN   \n",
+       "24                                        98.239999   \n",
+       "25                                              NaN   \n",
+       "26                                              NaN   \n",
+       "27                                              NaN   \n",
+       "28                                        98.325263   \n",
+       "29                                              NaN   \n",
+       "...                                             ...   \n",
+       "44216                                     98.639131   \n",
+       "44217                                           NaN   \n",
+       "44218                                           NaN   \n",
+       "44219                                           NaN   \n",
+       "44220                                           NaN   \n",
+       "44221                                           NaN   \n",
+       "44222                                           NaN   \n",
+       "44223                                           NaN   \n",
+       "44224                                           NaN   \n",
+       "44225                                           NaN   \n",
+       "44226                                           NaN   \n",
+       "44227                                     99.408525   \n",
+       "44228                                           NaN   \n",
+       "44229                                           NaN   \n",
+       "44230                                     99.398333   \n",
+       "44231                                     96.928572   \n",
+       "44232                                           NaN   \n",
+       "44233                                           NaN   \n",
+       "44234                                           NaN   \n",
+       "44235                                           NaN   \n",
+       "44236                                           NaN   \n",
+       "44237                                           NaN   \n",
+       "44238                                           NaN   \n",
+       "44239                                           NaN   \n",
+       "44240                                           NaN   \n",
+       "44241                                     99.357306   \n",
+       "44242                                           NaN   \n",
+       "44243                                     96.350000   \n",
+       "44244                                     97.117143   \n",
+       "44245                                           NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223761_COUNT  \\\n",
+       "0                                        98.537500   \n",
+       "1                                        97.166667   \n",
+       "2                                              NaN   \n",
+       "3                                              NaN   \n",
+       "4                                        98.100000   \n",
+       "5                                        98.550000   \n",
+       "6                                        98.380000   \n",
+       "7                                              NaN   \n",
+       "8                                        97.975000   \n",
+       "9                                        96.050000   \n",
+       "10                                             NaN   \n",
+       "11                                             NaN   \n",
+       "12                                       99.466667   \n",
+       "13                                             NaN   \n",
+       "14                                             NaN   \n",
+       "15                                       98.500000   \n",
+       "16                                      100.772222   \n",
+       "17                                             NaN   \n",
+       "18                                       99.345455   \n",
+       "19                                             NaN   \n",
+       "20                                       98.312500   \n",
+       "21                                       97.760000   \n",
+       "22                                             NaN   \n",
+       "23                                             NaN   \n",
+       "24                                             NaN   \n",
+       "25                                             NaN   \n",
+       "26                                             NaN   \n",
+       "27                                             NaN   \n",
+       "28                                             NaN   \n",
+       "29                                       96.525000   \n",
+       "...                                            ...   \n",
+       "44216                                          NaN   \n",
+       "44217                                    98.475000   \n",
+       "44218                                    96.275000   \n",
+       "44219                                          NaN   \n",
+       "44220                                          NaN   \n",
+       "44221                                          NaN   \n",
+       "44222                                    99.240000   \n",
+       "44223                                    98.450000   \n",
+       "44224                                          NaN   \n",
+       "44225                                          NaN   \n",
+       "44226                                    99.753333   \n",
+       "44227                                          NaN   \n",
+       "44228                                          NaN   \n",
+       "44229                                    97.580000   \n",
+       "44230                                          NaN   \n",
+       "44231                                          NaN   \n",
+       "44232                                    98.484375   \n",
+       "44233                                          NaN   \n",
+       "44234                                          NaN   \n",
+       "44235                                          NaN   \n",
+       "44236                                    97.977778   \n",
+       "44237                                          NaN   \n",
+       "44238                                          NaN   \n",
+       "44239                                          NaN   \n",
+       "44240                                    95.800000   \n",
+       "44241                                          NaN   \n",
+       "44242                                          NaN   \n",
+       "44243                                          NaN   \n",
+       "44244                                          NaN   \n",
+       "44245                                    98.655000   \n",
+       "\n",
+       "       temperature body_known_qn_degF_678_COUNT  \\\n",
+       "0                                           NaN   \n",
+       "1                                           NaN   \n",
+       "2                                     97.533334   \n",
+       "3                                     98.591667   \n",
+       "4                                           NaN   \n",
+       "5                                           NaN   \n",
+       "6                                           NaN   \n",
+       "7                                    100.649998   \n",
+       "8                                           NaN   \n",
+       "9                                           NaN   \n",
+       "10                                    98.536364   \n",
+       "11                                          NaN   \n",
+       "12                                          NaN   \n",
+       "13                                    99.099998   \n",
+       "14                                    95.300003   \n",
+       "15                                          NaN   \n",
+       "16                                          NaN   \n",
+       "17                                          NaN   \n",
+       "18                                          NaN   \n",
+       "19                                    98.800003   \n",
+       "20                                          NaN   \n",
+       "21                                          NaN   \n",
+       "22                                    98.445455   \n",
+       "23                                          NaN   \n",
+       "24                                          NaN   \n",
+       "25                                    97.320000   \n",
+       "26                                    96.700000   \n",
+       "27                                    96.920000   \n",
+       "28                                          NaN   \n",
+       "29                                          NaN   \n",
+       "...                                         ...   \n",
+       "44216                                 98.302703   \n",
+       "44217                                       NaN   \n",
+       "44218                                       NaN   \n",
+       "44219                                 97.800003   \n",
+       "44220                                 95.740001   \n",
+       "44221                                 97.920000   \n",
+       "44222                                       NaN   \n",
+       "44223                                       NaN   \n",
+       "44224                                 98.130000   \n",
+       "44225                                 97.900002   \n",
+       "44226                                       NaN   \n",
+       "44227                                 98.071875   \n",
+       "44228                                100.526316   \n",
+       "44229                                       NaN   \n",
+       "44230                                       NaN   \n",
+       "44231                                       NaN   \n",
+       "44232                                       NaN   \n",
+       "44233                                100.278462   \n",
+       "44234                                       NaN   \n",
+       "44235                                 97.074999   \n",
+       "44236                                       NaN   \n",
+       "44237                                 97.485713   \n",
+       "44238                                 97.264285   \n",
+       "44239                                 95.400002   \n",
+       "44240                                       NaN   \n",
+       "44241                                 97.670000   \n",
+       "44242                                 98.980953   \n",
+       "44243                                       NaN   \n",
+       "44244                                       NaN   \n",
+       "44245                                       NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223762(degC)_COUNT  \\\n",
+       "0                                                    NaN   \n",
+       "1                                                    NaN   \n",
+       "2                                                    NaN   \n",
+       "3                                                    NaN   \n",
+       "4                                                    NaN   \n",
+       "5                                                    NaN   \n",
+       "6                                              97.721177   \n",
+       "7                                                    NaN   \n",
+       "8                                                    NaN   \n",
+       "9                                                    NaN   \n",
+       "10                                                   NaN   \n",
+       "11                                             97.481429   \n",
+       "12                                                   NaN   \n",
+       "13                                                   NaN   \n",
+       "14                                                   NaN   \n",
+       "15                                                   NaN   \n",
+       "16                                             99.895122   \n",
+       "17                                                   NaN   \n",
+       "18                                                   NaN   \n",
+       "19                                                   NaN   \n",
+       "20                                                   NaN   \n",
+       "21                                                   NaN   \n",
+       "22                                                   NaN   \n",
+       "23                                             94.983637   \n",
+       "24                                                   NaN   \n",
+       "25                                                   NaN   \n",
+       "26                                                   NaN   \n",
+       "27                                                   NaN   \n",
+       "28                                                   NaN   \n",
+       "29                                                   NaN   \n",
+       "...                                                  ...   \n",
+       "44216                                                NaN   \n",
+       "44217                                                NaN   \n",
+       "44218                                                NaN   \n",
+       "44219                                                NaN   \n",
+       "44220                                                NaN   \n",
+       "44221                                                NaN   \n",
+       "44222                                                NaN   \n",
+       "44223                                                NaN   \n",
+       "44224                                                NaN   \n",
+       "44225                                                NaN   \n",
+       "44226                                                NaN   \n",
+       "44227                                                NaN   \n",
+       "44228                                                NaN   \n",
+       "44229                                                NaN   \n",
+       "44230                                                NaN   \n",
+       "44231                                                NaN   \n",
+       "44232                                                NaN   \n",
+       "44233                                                NaN   \n",
+       "44234                                          97.112000   \n",
+       "44235                                                NaN   \n",
+       "44236                                                NaN   \n",
+       "44237                                                NaN   \n",
+       "44238                                                NaN   \n",
+       "44239                                                NaN   \n",
+       "44240                                          94.640000   \n",
+       "44241                                                NaN   \n",
+       "44242                                                NaN   \n",
+       "44243                                                NaN   \n",
+       "44244                                                NaN   \n",
+       "44245                                                NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_676(degC)_COUNT  \\\n",
+       "0                                                 NaN   \n",
+       "1                                                 NaN   \n",
+       "2                                                 NaN   \n",
+       "3                                                 NaN   \n",
+       "4                                                 NaN   \n",
+       "5                                                 NaN   \n",
+       "6                                                 NaN   \n",
+       "7                                                 NaN   \n",
+       "8                                                 NaN   \n",
+       "9                                                 NaN   \n",
+       "10                                                NaN   \n",
+       "11                                                NaN   \n",
+       "12                                                NaN   \n",
+       "13                                          98.178868   \n",
+       "14                                                NaN   \n",
+       "15                                                NaN   \n",
+       "16                                                NaN   \n",
+       "17                                          98.948750   \n",
+       "18                                                NaN   \n",
+       "19                                                NaN   \n",
+       "20                                                NaN   \n",
+       "21                                                NaN   \n",
+       "22                                                NaN   \n",
+       "23                                                NaN   \n",
+       "24                                          98.239999   \n",
+       "25                                                NaN   \n",
+       "26                                                NaN   \n",
+       "27                                                NaN   \n",
+       "28                                          98.325263   \n",
+       "29                                                NaN   \n",
+       "...                                               ...   \n",
+       "44216                                       98.639131   \n",
+       "44217                                             NaN   \n",
+       "44218                                             NaN   \n",
+       "44219                                             NaN   \n",
+       "44220                                             NaN   \n",
+       "44221                                             NaN   \n",
+       "44222                                             NaN   \n",
+       "44223                                             NaN   \n",
+       "44224                                             NaN   \n",
+       "44225                                             NaN   \n",
+       "44226                                             NaN   \n",
+       "44227                                       99.408525   \n",
+       "44228                                             NaN   \n",
+       "44229                                             NaN   \n",
+       "44230                                       99.398333   \n",
+       "44231                                       96.928572   \n",
+       "44232                                             NaN   \n",
+       "44233                                             NaN   \n",
+       "44234                                             NaN   \n",
+       "44235                                             NaN   \n",
+       "44236                                             NaN   \n",
+       "44237                                             NaN   \n",
+       "44238                                             NaN   \n",
+       "44239                                             NaN   \n",
+       "44240                                             NaN   \n",
+       "44241                                       99.357306   \n",
+       "44242                                             NaN   \n",
+       "44243                                       96.350000   \n",
+       "44244                                       97.117143   \n",
+       "44245                                             NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223761_LAST  \\\n",
+       "0                                       98.537500   \n",
+       "1                                       97.166667   \n",
+       "2                                             NaN   \n",
+       "3                                             NaN   \n",
+       "4                                       98.100000   \n",
+       "5                                       98.550000   \n",
+       "6                                       98.380000   \n",
+       "7                                             NaN   \n",
+       "8                                       97.975000   \n",
+       "9                                       96.050000   \n",
+       "10                                            NaN   \n",
+       "11                                            NaN   \n",
+       "12                                      99.466667   \n",
+       "13                                            NaN   \n",
+       "14                                            NaN   \n",
+       "15                                      98.500000   \n",
+       "16                                     100.772222   \n",
+       "17                                            NaN   \n",
+       "18                                      99.345455   \n",
+       "19                                            NaN   \n",
+       "20                                      98.312500   \n",
+       "21                                      97.760000   \n",
+       "22                                            NaN   \n",
+       "23                                            NaN   \n",
+       "24                                            NaN   \n",
+       "25                                            NaN   \n",
+       "26                                            NaN   \n",
+       "27                                            NaN   \n",
+       "28                                            NaN   \n",
+       "29                                      96.525000   \n",
+       "...                                           ...   \n",
+       "44216                                         NaN   \n",
+       "44217                                   98.475000   \n",
+       "44218                                   96.275000   \n",
+       "44219                                         NaN   \n",
+       "44220                                         NaN   \n",
+       "44221                                         NaN   \n",
+       "44222                                   99.240000   \n",
+       "44223                                   98.450000   \n",
+       "44224                                         NaN   \n",
+       "44225                                         NaN   \n",
+       "44226                                   99.753333   \n",
+       "44227                                         NaN   \n",
+       "44228                                         NaN   \n",
+       "44229                                   97.580000   \n",
+       "44230                                         NaN   \n",
+       "44231                                         NaN   \n",
+       "44232                                   98.484375   \n",
+       "44233                                         NaN   \n",
+       "44234                                         NaN   \n",
+       "44235                                         NaN   \n",
+       "44236                                   97.977778   \n",
+       "44237                                         NaN   \n",
+       "44238                                         NaN   \n",
+       "44239                                         NaN   \n",
+       "44240                                   95.800000   \n",
+       "44241                                         NaN   \n",
+       "44242                                         NaN   \n",
+       "44243                                         NaN   \n",
+       "44244                                         NaN   \n",
+       "44245                                   98.655000   \n",
+       "\n",
+       "       temperature body_known_qn_degF_678_LAST  \\\n",
+       "0                                          NaN   \n",
+       "1                                          NaN   \n",
+       "2                                    97.533334   \n",
+       "3                                    98.591667   \n",
+       "4                                          NaN   \n",
+       "5                                          NaN   \n",
+       "6                                          NaN   \n",
+       "7                                   100.649998   \n",
+       "8                                          NaN   \n",
+       "9                                          NaN   \n",
+       "10                                   98.536364   \n",
+       "11                                         NaN   \n",
+       "12                                         NaN   \n",
+       "13                                   99.099998   \n",
+       "14                                   95.300003   \n",
+       "15                                         NaN   \n",
+       "16                                         NaN   \n",
+       "17                                         NaN   \n",
+       "18                                         NaN   \n",
+       "19                                   98.800003   \n",
+       "20                                         NaN   \n",
+       "21                                         NaN   \n",
+       "22                                   98.445455   \n",
+       "23                                         NaN   \n",
+       "24                                         NaN   \n",
+       "25                                   97.320000   \n",
+       "26                                   96.700000   \n",
+       "27                                   96.920000   \n",
+       "28                                         NaN   \n",
+       "29                                         NaN   \n",
+       "...                                        ...   \n",
+       "44216                                98.302703   \n",
+       "44217                                      NaN   \n",
+       "44218                                      NaN   \n",
+       "44219                                97.800003   \n",
+       "44220                                95.740001   \n",
+       "44221                                97.920000   \n",
+       "44222                                      NaN   \n",
+       "44223                                      NaN   \n",
+       "44224                                98.130000   \n",
+       "44225                                97.900002   \n",
+       "44226                                      NaN   \n",
+       "44227                                98.071875   \n",
+       "44228                               100.526316   \n",
+       "44229                                      NaN   \n",
+       "44230                                      NaN   \n",
+       "44231                                      NaN   \n",
+       "44232                                      NaN   \n",
+       "44233                               100.278462   \n",
+       "44234                                      NaN   \n",
+       "44235                                97.074999   \n",
+       "44236                                      NaN   \n",
+       "44237                                97.485713   \n",
+       "44238                                97.264285   \n",
+       "44239                                95.400002   \n",
+       "44240                                      NaN   \n",
+       "44241                                97.670000   \n",
+       "44242                                98.980953   \n",
+       "44243                                      NaN   \n",
+       "44244                                      NaN   \n",
+       "44245                                      NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_223762(degC)_LAST  \\\n",
+       "0                                                   NaN   \n",
+       "1                                                   NaN   \n",
+       "2                                                   NaN   \n",
+       "3                                                   NaN   \n",
+       "4                                                   NaN   \n",
+       "5                                                   NaN   \n",
+       "6                                             97.721177   \n",
+       "7                                                   NaN   \n",
+       "8                                                   NaN   \n",
+       "9                                                   NaN   \n",
+       "10                                                  NaN   \n",
+       "11                                            97.481429   \n",
+       "12                                                  NaN   \n",
+       "13                                                  NaN   \n",
+       "14                                                  NaN   \n",
+       "15                                                  NaN   \n",
+       "16                                            99.895122   \n",
+       "17                                                  NaN   \n",
+       "18                                                  NaN   \n",
+       "19                                                  NaN   \n",
+       "20                                                  NaN   \n",
+       "21                                                  NaN   \n",
+       "22                                                  NaN   \n",
+       "23                                            94.983637   \n",
+       "24                                                  NaN   \n",
+       "25                                                  NaN   \n",
+       "26                                                  NaN   \n",
+       "27                                                  NaN   \n",
+       "28                                                  NaN   \n",
+       "29                                                  NaN   \n",
+       "...                                                 ...   \n",
+       "44216                                               NaN   \n",
+       "44217                                               NaN   \n",
+       "44218                                               NaN   \n",
+       "44219                                               NaN   \n",
+       "44220                                               NaN   \n",
+       "44221                                               NaN   \n",
+       "44222                                               NaN   \n",
+       "44223                                               NaN   \n",
+       "44224                                               NaN   \n",
+       "44225                                               NaN   \n",
+       "44226                                               NaN   \n",
+       "44227                                               NaN   \n",
+       "44228                                               NaN   \n",
+       "44229                                               NaN   \n",
+       "44230                                               NaN   \n",
+       "44231                                               NaN   \n",
+       "44232                                               NaN   \n",
+       "44233                                               NaN   \n",
+       "44234                                         97.112000   \n",
+       "44235                                               NaN   \n",
+       "44236                                               NaN   \n",
+       "44237                                               NaN   \n",
+       "44238                                               NaN   \n",
+       "44239                                               NaN   \n",
+       "44240                                         94.640000   \n",
+       "44241                                               NaN   \n",
+       "44242                                               NaN   \n",
+       "44243                                               NaN   \n",
+       "44244                                               NaN   \n",
+       "44245                                               NaN   \n",
+       "\n",
+       "       temperature body_known_qn_degF_676(degC)_LAST  \n",
+       "0                                                NaN  \n",
+       "1                                                NaN  \n",
+       "2                                                NaN  \n",
+       "3                                                NaN  \n",
+       "4                                                NaN  \n",
+       "5                                                NaN  \n",
+       "6                                                NaN  \n",
+       "7                                                NaN  \n",
+       "8                                                NaN  \n",
+       "9                                                NaN  \n",
+       "10                                               NaN  \n",
+       "11                                               NaN  \n",
+       "12                                               NaN  \n",
+       "13                                         98.178868  \n",
+       "14                                               NaN  \n",
+       "15                                               NaN  \n",
+       "16                                               NaN  \n",
+       "17                                         98.948750  \n",
+       "18                                               NaN  \n",
+       "19                                               NaN  \n",
+       "20                                               NaN  \n",
+       "21                                               NaN  \n",
+       "22                                               NaN  \n",
+       "23                                               NaN  \n",
+       "24                                         98.239999  \n",
+       "25                                               NaN  \n",
+       "26                                               NaN  \n",
+       "27                                               NaN  \n",
+       "28                                         98.325263  \n",
+       "29                                               NaN  \n",
+       "...                                              ...  \n",
+       "44216                                      98.639131  \n",
+       "44217                                            NaN  \n",
+       "44218                                            NaN  \n",
+       "44219                                            NaN  \n",
+       "44220                                            NaN  \n",
+       "44221                                            NaN  \n",
+       "44222                                            NaN  \n",
+       "44223                                            NaN  \n",
+       "44224                                            NaN  \n",
+       "44225                                            NaN  \n",
+       "44226                                            NaN  \n",
+       "44227                                      99.408525  \n",
+       "44228                                            NaN  \n",
+       "44229                                            NaN  \n",
+       "44230                                      99.398333  \n",
+       "44231                                      96.928572  \n",
+       "44232                                            NaN  \n",
+       "44233                                            NaN  \n",
+       "44234                                            NaN  \n",
+       "44235                                            NaN  \n",
+       "44236                                            NaN  \n",
+       "44237                                            NaN  \n",
+       "44238                                            NaN  \n",
+       "44239                                            NaN  \n",
+       "44240                                            NaN  \n",
+       "44241                                      99.357306  \n",
+       "44242                                            NaN  \n",
+       "44243                                      96.350000  \n",
+       "44244                                      97.117143  \n",
+       "44245                                            NaN  \n",
+       "\n",
+       "[44246 rows x 16 columns]"
+      ]
+     },
+     "execution_count": 121,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "test_mapper_pipeline.transform(df)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 152,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<units.MedicalUreg at 0x31082eb8>"
+      ]
+     },
+     "execution_count": 152,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "ureg"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 197,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "mass = ureg.parse_units('degF')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 198,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<UnitsContainer({'[temperature]': 1.0})>"
+      ]
+     },
+     "execution_count": 198,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "mass.dimensionality"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 157,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "from pint.unit import UnitsContainer"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 160,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "True"
+      ]
+     },
+     "execution_count": 160,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "units.dimensionality == UnitsContainer({'[length]':3.0})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 166,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "1e-06 kilogram"
+      ],
+      "text/latex": [
+       "$1e-06\\ \\mathrm{kilogram}$"
+      ],
+      "text/plain": [
+       "<Quantity(1e-06, 'kilogram')>"
+      ]
+     },
+     "execution_count": 166,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "(1*units).to_base_units()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 161,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "uc = UnitsContainer({'[length]':3.0})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "uc.dim"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "import constants\n",
+    "import mimic\n",
+    "import utils\n",
+    "import pandas as pd\n",
+    "import icu_data_defs\n",
+    "import units\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "import transformers\n",
+    "import logger\n",
+    "import features\n",
+    "import warnings\n",
+    "warnings.filterwarnings('ignore')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 36,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload(mimic)\n",
+    "reload(units)\n",
+    "reload(utils)\n",
+    "reload(transformers)\n",
+    "def mimic_ETL(components,data_dict,hdf5_fname,\n",
+    "              hadm_ids=constants.ALL,\n",
+    "              agg_func=lambda x:x.iloc[0]):\n",
+    "    '''Run extract -> transform -> clean for each component, saving every stage.\n",
+    "\n",
+    "    components : iterable of component names (.upper() is called on each)\n",
+    "    data_dict  : data dictionary handed to the mimic / transformers helpers\n",
+    "    hdf5_fname : file name passed to utils.save_df for every saved frame\n",
+    "    hadm_ids   : constants.ALL (default) or a sized collection of admission ids\n",
+    "    agg_func   : callable given to transformers.same_index_aggregator;\n",
+    "                 the default returns x.iloc[0]\n",
+    "\n",
+    "    Frames are saved under the keys 'context', 'extracted/<component>',\n",
+    "    'transformed/<component>' and 'cleaned/<component>'. Returns None.\n",
+    "    '''\n",
+    "    # Log either the ALL sentinel itself or the number of requested admissions.\n",
+    "    if hadm_ids == constants.ALL:\n",
+    "        admissions = hadm_ids\n",
+    "    else:\n",
+    "        admissions = len(hadm_ids)\n",
+    "    logger.log('BEGIN ETL for {} admissions'.format(admissions),new_level=True)\n",
+    "\n",
+    "    category_map = mimic.mimic_category_map(data_dict)\n",
+    "    ureg = units.MedicalUreg()\n",
+    "    extractor = mimic.mimic_extractor('config/mimic_item_map.csv',data_dict)\n",
+    "    transformer_pipe = mimic.transform_pipeline()\n",
+    "\n",
+    "    # Cleaning steps shared by every component, applied in this order.\n",
+    "    clean_steps = [\n",
+    "        ('aggregate_same_datetime',transformers.same_index_aggregator(agg_func)),\n",
+    "        ('split_dtype',transformers.split_dtype()),\n",
+    "        ('standardize_columns',transformers.column_standardizer(data_dict,ureg)),\n",
+    "        ('standardize_categories',transformers.standardize_categories(data_dict,category_map)),\n",
+    "        ('split_bad_categories',transformers.split_bad_categories(data_dict)),\n",
+    "        ('one_hotter',transformers.nominal_to_onehot()),\n",
+    "        ('drop_oob_values',transformers.oob_value_remover(data_dict))\n",
+    "    ]\n",
+    "    cleaner_pipe = Pipeline(clean_steps)\n",
+    "\n",
+    "    def report(stage_df,source_df):\n",
+    "        # Show a preview and summary of a stage, then print utils.data_loss\n",
+    "        # of that stage measured against the extracted values.\n",
+    "        display(stage_df.head())\n",
+    "        display(stage_df.describe())\n",
+    "        print(utils.data_loss(source_df.set_index('id').value.to_frame(),stage_df))\n",
+    "\n",
+    "    logger.log('Extract CONTEXT...')\n",
+    "    context = mimic.get_context_data(hadm_ids)\n",
+    "    utils.save_df(context,hdf5_fname,'context')\n",
+    "\n",
+    "    for component in components:\n",
+    "        logger.log(component.upper(),new_level=True)\n",
+    "\n",
+    "        # Stage 1: extraction, logged in its own nested level.\n",
+    "        logger.log('Extracting...',new_level=True)\n",
+    "        extracted = extractor.extract_component(component,hadm_ids)\n",
+    "        utils.save_df(extracted,hdf5_fname,'extracted/{}'.format(component))\n",
+    "        logger.end_log_level()\n",
+    "\n",
+    "        display(extracted.head())\n",
+    "\n",
+    "        # Stage 2: transform; the pipeline's add_level step is set to this component.\n",
+    "        logger.log('Transforming... {}'.format(extracted.shape))\n",
+    "        transformer_pipe.set_params(add_level__level_val=component)\n",
+    "        transformed = transformer_pipe.transform(extracted)\n",
+    "        utils.save_df(transformed,hdf5_fname,'transformed/{}'.format(component))\n",
+    "        report(transformed,extracted)\n",
+    "\n",
+    "        # Stage 3: standard cleaning.\n",
+    "        logger.log('Cleaning... {}'.format(transformed.shape))\n",
+    "        cleaned = cleaner_pipe.transform(transformed)\n",
+    "        utils.save_df(cleaned,hdf5_fname,'cleaned/{}'.format(component))\n",
+    "        report(cleaned,extracted)\n",
+    "\n",
+    "        # Drop the per-component frames before starting the next component.\n",
+    "        del cleaned,transformed,extracted\n",
+    "        logger.end_log_level()\n",
+    "\n",
+    "    logger.end_log()\n",
+    "           \n",
+    "\n",
+    "def mimic_features(hdf5_fname,specific_path,labels,\n",
+    "                   custom_cleaners,segmenter,feature_tuples):\n",
+    "    '''Build a feature frame from previously cleaned component data.\n",
+    "\n",
+    "    For each label the frame stored under 'cleaned/<label>' is opened, passed\n",
+    "    through custom_cleaners.transform and saved under\n",
+    "    '<specific_path>/cleaned/<label>'. The per-label frames are outer-joined and\n",
+    "    saved under '<specific_path>/cleaned/all', then run through\n",
+    "    segmenter.transform ('<specific_path>/segmented') and through the mapper\n",
+    "    built by features.make_mapper ('<specific_path>/features').\n",
+    "\n",
+    "    hdf5_fname      : file name used for every utils.open_df / utils.save_df call\n",
+    "    specific_path   : key prefix for everything this function saves\n",
+    "    labels          : iterable of component labels to load and join\n",
+    "    custom_cleaners : object exposing transform(df)\n",
+    "    segmenter       : object exposing transform(df)\n",
+    "    feature_tuples  : passed unchanged to features.make_mapper\n",
+    "\n",
+    "    Returns the feature frame produced by the mapper.\n",
+    "    '''\n",
+    "    df_all = None\n",
+    "\n",
+    "    for label in labels:\n",
+    "        df_base = utils.open_df(hdf5_fname,'cleaned/{}'.format(label))\n",
+    "\n",
+    "        df_cleaned = custom_cleaners.transform(df_base)\n",
+    "        utils.save_df(df_cleaned,hdf5_fname,'{}/cleaned/{}'.format(specific_path,label))\n",
+    "\n",
+    "        if df_all is None:\n",
+    "            df_all = df_cleaned\n",
+    "        else:\n",
+    "            df_all = df_all.join(df_cleaned,how='outer')\n",
+    "        # df_all keeps whatever it still needs; release the per-label names.\n",
+    "        del df_base,df_cleaned\n",
+    "\n",
+    "    # Format the key with specific_path so the joined frame is stored next to the\n",
+    "    # per-label frames instead of under a literal '{}' key.\n",
+    "    utils.save_df(df_all,hdf5_fname,'{}/cleaned/all'.format(specific_path))\n",
+    "\n",
+    "    df_segmented = segmenter.transform(df_all)\n",
+    "    # Save to the hdf5_fname argument: this function has no hdf5_fname_target,\n",
+    "    # so using that name only worked if a global of that name happened to exist.\n",
+    "    utils.save_df(df_segmented,hdf5_fname,'{}/segmented'.format(specific_path))\n",
+    "    del df_all\n",
+    "\n",
+    "    mapped_ft = features.make_mapper(feature_tuples,df_segmented)\n",
+    "    df_features = mapped_ft.transform(df_segmented)\n",
+    "    utils.save_df(df_features,hdf5_fname,'{}/features'.format(specific_path))\n",
+    "    del df_segmented\n",
+    "\n",
+    "    return df_features"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 37,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "def do_ETL(data_dict,components,tag,n,seed=42):\n",
+    "    '''Run mimic_ETL for n admissions and return the output file name.\n",
+    "\n",
+    "    n is either constants.ALL, which is passed straight through as hadm_ids,\n",
+    "    or a value handed to mimic.sample_hadm_ids together with seed.\n",
+    "    The output name is 'data/mimic_<tag>_<n>'.\n",
+    "    '''\n",
+    "    hdf5_fname = 'data/mimic_{}_{}'.format(tag,n)\n",
+    "    if n == constants.ALL:\n",
+    "        hadm_ids = n\n",
+    "    else:\n",
+    "        hadm_ids = mimic.sample_hadm_ids(n,seed)\n",
+    "    mimic_ETL(components,data_dict,hdf5_fname,hadm_ids=hadm_ids)\n",
+    "    return hdf5_fname"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "reload(logger)\n",
+    "\n",
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n",
+    "components = data_dict.get_panel_defintions(12).component.unique().tolist() #12 is \"simple data\"\n",
+    "tag = 'simple'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-20 10:03:09) BEGIN ETL for 1000 admissions\n",
+      "(2017-06-20 10:03:09)>> Extract CONTEXT...\n",
+      "(2017-06-20 10:03:17)<< DONE (8.0s)\n",
+      "(2017-06-20 10:03:17)>> BLOOD PRESSURE SYSTOLIC\n",
+      "(2017-06-20 10:03:17)>>>> Extracting...\n",
+      "(2017-06-20 10:03:17)>>>>>> Extracting 14 items from chartevents\n",
+      "51        35823\n",
+      "455       26680\n",
+      "220179    21957\n",
+      "220050    15186\n",
+      "3313       2250\n",
+      "225309     1251\n",
+      "3315         50\n",
+      "3317         24\n",
+      "3323         21\n",
+      "442          19\n",
+      "3321         19\n",
+      "224167       12\n",
+      "227243        8\n",
+      "Name: itemid, dtype: int64\n",
+      "Empty DataFrame\n",
+      "Columns: [id, datetime, value, units, itemid]\n",
+      "Index: []\n",
+      "(2017-06-20 10:04:09)<<<<<< DONE (52.0s)\n",
+      "(2017-06-20 10:04:09)>>>>>> Combine DF\n",
+      "(2017-06-20 10:04:09)<<<<<< DONE (0.0s)\n",
+      "(2017-06-20 10:04:09)>>>>>> Clean UOM\n",
+      "(2017-06-20 10:04:10)<<<<<< DONE (1.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th>value</th>\n",
+       "      <th>units</th>\n",
+       "      <th>itemid</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>107880</td>\n",
+       "      <td>2106-06-19 22:00:00</td>\n",
+       "      <td>99</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>107880</td>\n",
+       "      <td>2106-06-19 23:00:00</td>\n",
+       "      <td>98</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>107880</td>\n",
+       "      <td>2106-06-20 00:00:00</td>\n",
+       "      <td>122</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>107880</td>\n",
+       "      <td>2106-06-20 01:00:00</td>\n",
+       "      <td>150</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>107880</td>\n",
+       "      <td>2106-06-20 02:00:00</td>\n",
+       "      <td>133</td>\n",
+       "      <td>mmHg</td>\n",
+       "      <td>51</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       id            datetime value units  itemid\n",
+       "0  107880 2106-06-19 22:00:00    99  mmHg      51\n",
+       "1  107880 2106-06-19 23:00:00    98  mmHg      51\n",
+       "2  107880 2106-06-20 00:00:00   122  mmHg      51\n",
+       "3  107880 2106-06-20 01:00:00   150  mmHg      51\n",
+       "4  107880 2106-06-20 02:00:00   133  mmHg      51"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-20 10:04:10)<<<< DONE (53.0s)\n",
+      "(2017-06-20 10:04:10)>>>> Transforming... (103300, 5)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>component</th>\n",
+       "      <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th>cc/min</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">mmHg</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">cc/min</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">mmHg</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>3313</th>\n",
+       "      <th>455</th>\n",
+       "      <th>51</th>\n",
+       "      <th>220179</th>\n",
+       "      <th>442</th>\n",
+       "      <th>220050</th>\n",
+       "      <th>3315</th>\n",
+       "      <th>3317</th>\n",
+       "      <th>3321</th>\n",
+       "      <th>3323</th>\n",
+       "      <th>224167</th>\n",
+       "      <th>227243</th>\n",
+       "      <th>225309</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100304</th>\n",
+       "      <th>2161-10-01 22:00:00</th>\n",
+       "      <td>67</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-10-01 23:00:00</th>\n",
+       "      <td>68</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100788</th>\n",
+       "      <th>2120-04-10 14:00:00</th>\n",
+       "      <td>None</td>\n",
+       "      <td>127</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2120-04-10 15:00:00</th>\n",
+       "      <td>None</td>\n",
+       "      <td>127</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2120-04-10 16:00:00</th>\n",
+       "      <td>None</td>\n",
+       "      <td>123</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "      <td>None</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "component                  blood pressure systolic                       \\\n",
+       "units                                       cc/min   mmHg                 \n",
+       "description                                 3313   455    51     220179   \n",
+       "id     datetime                                                           \n",
+       "100304 2161-10-01 22:00:00                      67   None   None   None   \n",
+       "       2161-10-01 23:00:00                      68   None   None   None   \n",
+       "100788 2120-04-10 14:00:00                    None    127   None   None   \n",
+       "       2120-04-10 15:00:00                    None    127   None   None   \n",
+       "       2120-04-10 16:00:00                    None    123   None   None   \n",
+       "\n",
+       "component                                                                    \\\n",
+       "units                                    cc/min                        mmHg   \n",
+       "description                442    220050 3315   3317   3321   3323   224167   \n",
+       "id     datetime                                                               \n",
+       "100304 2161-10-01 22:00:00   None   None   None   None   None   None   None   \n",
+       "       2161-10-01 23:00:00   None   None   None   None   None   None   None   \n",
+       "100788 2120-04-10 14:00:00   None   None   None   None   None   None   None   \n",
+       "       2120-04-10 15:00:00   None   None   None   None   None   None   None   \n",
+       "       2120-04-10 16:00:00   None   None   None   None   None   None   None   \n",
+       "\n",
+       "component                                 \n",
+       "units                                     \n",
+       "description                227243 225309  \n",
+       "id     datetime                           \n",
+       "100304 2161-10-01 22:00:00   None   None  \n",
+       "       2161-10-01 23:00:00   None   None  \n",
+       "100788 2120-04-10 14:00:00   None   None  \n",
+       "       2120-04-10 15:00:00   None   None  \n",
+       "       2120-04-10 16:00:00   None   None  "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>component</th>\n",
+       "      <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th>cc/min</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">mmHg</th>\n",
+       "      <th colspan=\"4\" halign=\"left\">cc/min</th>\n",
+       "      <th colspan=\"3\" halign=\"left\">mmHg</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>3313</th>\n",
+       "      <th>455</th>\n",
+       "      <th>51</th>\n",
+       "      <th>220179</th>\n",
+       "      <th>442</th>\n",
+       "      <th>220050</th>\n",
+       "      <th>3315</th>\n",
+       "      <th>3317</th>\n",
+       "      <th>3321</th>\n",
+       "      <th>3323</th>\n",
+       "      <th>224167</th>\n",
+       "      <th>227243</th>\n",
+       "      <th>225309</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>2241</td>\n",
+       "      <td>26480</td>\n",
+       "      <td>35622</td>\n",
+       "      <td>21957</td>\n",
+       "      <td>17</td>\n",
+       "      <td>15186</td>\n",
+       "      <td>22</td>\n",
+       "      <td>16</td>\n",
+       "      <td>13</td>\n",
+       "      <td>14</td>\n",
+       "      <td>12</td>\n",
+       "      <td>8</td>\n",
+       "      <td>1251</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unique</th>\n",
+       "      <td>81</td>\n",
+       "      <td>181</td>\n",
+       "      <td>208</td>\n",
+       "      <td>176</td>\n",
+       "      <td>14</td>\n",
+       "      <td>172</td>\n",
+       "      <td>21</td>\n",
+       "      <td>13</td>\n",
+       "      <td>12</td>\n",
+       "      <td>11</td>\n",
+       "      <td>9</td>\n",
+       "      <td>8</td>\n",
+       "      <td>126</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>top</th>\n",
+       "      <td>72</td>\n",
+       "      <td>106</td>\n",
+       "      <td>108</td>\n",
+       "      <td>112</td>\n",
+       "      <td>122</td>\n",
+       "      <td>120</td>\n",
+       "      <td>89</td>\n",
+       "      <td>74</td>\n",
+       "      <td>66</td>\n",
+       "      <td>80</td>\n",
+       "      <td>102</td>\n",
+       "      <td>110</td>\n",
+       "      <td>107</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>freq</th>\n",
+       "      <td>91</td>\n",
+       "      <td>494</td>\n",
+       "      <td>641</td>\n",
+       "      <td>457</td>\n",
+       "      <td>2</td>\n",
+       "      <td>296</td>\n",
+       "      <td>2</td>\n",
+       "      <td>2</td>\n",
+       "      <td>2</td>\n",
+       "      <td>2</td>\n",
+       "      <td>4</td>\n",
+       "      <td>1</td>\n",
+       "      <td>41</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "component   blood pressure systolic                                            \\\n",
+       "units                        cc/min   mmHg                             cc/min   \n",
+       "description                  3313   455    51     220179 442    220050 3315     \n",
+       "count                          2241  26480  35622  21957     17  15186     22   \n",
+       "unique                           81    181    208    176     14    172     21   \n",
+       "top                              72    106    108    112    122    120     89   \n",
+       "freq                             91    494    641    457      2    296      2   \n",
+       "\n",
+       "component                                              \n",
+       "units                              mmHg                \n",
+       "description 3317   3321   3323   224167 227243 225309  \n",
+       "count           16     13     14     12      8   1251  \n",
+       "unique          13     12     11      9      8    126  \n",
+       "top             74     66     80    102    110    107  \n",
+       "freq             2      2      2      4      1     41  "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "((103300, 1), (97535, 13), 461L, 2, '0.2094% records')\n",
+      "(2017-06-20 10:04:12)<<<< DONE (2.0s)\n",
+      "(2017-06-20 10:04:12)>>>> Cleaning... (97535, 13)\n",
+      "(2017-06-20 10:04:14)<<<< DONE (2.0s)\n",
+      "(2017-06-20 10:04:14)>>>> Nominal to OneHot\n",
+      "(2017-06-20 10:04:14)<<<< DONE (0.0s)\n",
+      "(2017-06-20 10:04:14)>>>> Drop OOB data | (97527, 13)\n",
+      "(2017-06-20 10:04:14)>>>>>> blood pressure systolic, mmHg, 100525\n",
+      "(2017-06-20 10:04:19)<<<<<< DONE (5.0s)\n",
+      "(2017-06-20 10:04:19)>>>>>> blood pressure systolic, cc/min, 2306\n",
+      "(2017-06-20 10:04:19)<<<<<< DONE (0.0s)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>component</th>\n",
+       "      <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">mmHg</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">cc/min</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th>description</th>\n",
+       "      <th>220050</th>\n",
+       "      <th>220179</th>\n",
+       "      <th>224167</th>\n",
+       "      <th>225309</th>\n",
+       "      <th>227243</th>\n",
+       "      <th>442</th>\n",
+       "      <th>455</th>\n",
+       "      <th>51</th>\n",
+       "      <th>3313</th>\n",
+       "      <th>3315</th>\n",
+       "      <th>3317</th>\n",
+       "      <th>3321</th>\n",
+       "      <th>3323</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>id</th>\n",
+       "      <th>datetime</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"2\" valign=\"top\">100304</th>\n",
+       "      <th>2161-10-01 22:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>67.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2161-10-01 23:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>68.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">100788</th>\n",
+       "      <th>2120-04-10 14:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>127.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2120-04-10 15:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>127.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2120-04-10 16:00:00</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>123.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "component                  blood pressure systolic                       \\\n",
+       "status                                       known                        \n",
+       "variable_type                                   qn                        \n",
+       "units                                         mmHg                        \n",
+       "description                                 220050 220179 224167 225309   \n",
+       "id     datetime                                                           \n",
+       "100304 2161-10-01 22:00:00                     NaN    NaN    NaN    NaN   \n",
+       "       2161-10-01 23:00:00                     NaN    NaN    NaN    NaN   \n",
+       "100788 2120-04-10 14:00:00                     NaN    NaN    NaN    NaN   \n",
+       "       2120-04-10 15:00:00                     NaN    NaN    NaN    NaN   \n",
+       "       2120-04-10 16:00:00                     NaN    NaN    NaN    NaN   \n",
+       "\n",
+       "component                                                                     \n",
+       "status                                           unknown                      \n",
+       "variable_type                                         qn                      \n",
+       "units                                             cc/min                      \n",
+       "description                227243 442    455  51    3313 3315 3317 3321 3323  \n",
+       "id     datetime                                                               \n",
+       "100304 2161-10-01 22:00:00    NaN NaN    NaN NaN    67.0  NaN  NaN  NaN  NaN  \n",
+       "       2161-10-01 23:00:00    NaN NaN    NaN NaN    68.0  NaN  NaN  NaN  NaN  \n",
+       "100788 2120-04-10 14:00:00    NaN NaN  127.0 NaN     NaN  NaN  NaN  NaN  NaN  \n",
+       "       2120-04-10 15:00:00    NaN NaN  127.0 NaN     NaN  NaN  NaN  NaN  NaN  \n",
+       "       2120-04-10 16:00:00    NaN NaN  123.0 NaN     NaN  NaN  NaN  NaN  NaN  "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th>component</th>\n",
+       "      <th colspan=\"13\" halign=\"left\">blood pressure systolic</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>status</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">known</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">unknown</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>variable_type</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">qn</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">qn</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>units</th>\n",
+       "      <th colspan=\"8\" halign=\"left\">mmHg</th>\n",
+       "      <th colspan=\"5\" halign=\"left\">cc/min</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>description</th>\n",
+       "      <th>220050</th>\n",
+       "      <th>220179</th>\n",
+       "      <th>224167</th>\n",
+       "      <th>225309</th>\n",
+       "      <th>227243</th>\n",
+       "      <th>442</th>\n",
+       "      <th>455</th>\n",
+       "      <th>51</th>\n",
+       "      <th>3313</th>\n",
+       "      <th>3315</th>\n",
+       "      <th>3317</th>\n",
+       "      <th>3321</th>\n",
+       "      <th>3323</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>count</th>\n",
+       "      <td>15186.000000</td>\n",
+       "      <td>21957.000000</td>\n",
+       "      <td>12.000000</td>\n",
+       "      <td>1251.000000</td>\n",
+       "      <td>8.00000</td>\n",
+       "      <td>17.000000</td>\n",
+       "      <td>26478.000000</td>\n",
+       "      <td>35616.000000</td>\n",
+       "      <td>2241.000000</td>\n",
+       "      <td>22.000000</td>\n",
+       "      <td>16.00000</td>\n",
+       "      <td>13.000000</td>\n",
+       "      <td>14.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>mean</th>\n",
+       "      <td>118.988213</td>\n",
+       "      <td>119.200483</td>\n",
+       "      <td>104.416667</td>\n",
+       "      <td>110.457234</td>\n",
+       "      <td>111.87500</td>\n",
+       "      <td>122.882353</td>\n",
+       "      <td>119.150623</td>\n",
+       "      <td>121.264628</td>\n",
+       "      <td>70.371709</td>\n",
+       "      <td>77.727273</td>\n",
+       "      <td>76.68750</td>\n",
+       "      <td>77.846154</td>\n",
+       "      <td>75.714286</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>std</th>\n",
+       "      <td>23.366007</td>\n",
+       "      <td>21.757748</td>\n",
+       "      <td>15.559027</td>\n",
+       "      <td>20.465707</td>\n",
+       "      <td>19.05209</td>\n",
+       "      <td>31.262762</td>\n",
+       "      <td>23.206573</td>\n",
+       "      <td>25.927916</td>\n",
+       "      <td>12.969975</td>\n",
+       "      <td>15.495566</td>\n",
+       "      <td>17.72651</td>\n",
+       "      <td>14.932326</td>\n",
+       "      <td>14.514865</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>min</th>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>33.000000</td>\n",
+       "      <td>86.000000</td>\n",
+       "      <td>23.000000</td>\n",
+       "      <td>84.00000</td>\n",
+       "      <td>70.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>38.000000</td>\n",
+       "      <td>54.000000</td>\n",
+       "      <td>50.00000</td>\n",
+       "      <td>58.000000</td>\n",
+       "      <td>55.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>25%</th>\n",
+       "      <td>103.000000</td>\n",
+       "      <td>104.000000</td>\n",
+       "      <td>97.500000</td>\n",
+       "      <td>99.000000</td>\n",
+       "      <td>97.25000</td>\n",
+       "      <td>96.000000</td>\n",
+       "      <td>102.000000</td>\n",
+       "      <td>104.000000</td>\n",
+       "      <td>61.000000</td>\n",
+       "      <td>66.250000</td>\n",
+       "      <td>62.75000</td>\n",
+       "      <td>67.000000</td>\n",
+       "      <td>66.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>50%</th>\n",
+       "      <td>117.000000</td>\n",
+       "      <td>117.000000</td>\n",
+       "      <td>102.000000</td>\n",
+       "      <td>108.000000</td>\n",
+       "      <td>116.00000</td>\n",
+       "      <td>125.000000</td>\n",
+       "      <td>117.000000</td>\n",
+       "      <td>119.000000</td>\n",
+       "      <td>70.000000</td>\n",
+       "      <td>76.000000</td>\n",
+       "      <td>76.00000</td>\n",
+       "      <td>75.000000</td>\n",
+       "      <td>75.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>75%</th>\n",
+       "      <td>133.000000</td>\n",
+       "      <td>133.000000</td>\n",
+       "      <td>104.000000</td>\n",
+       "      <td>120.000000</td>\n",
+       "      <td>128.50000</td>\n",
+       "      <td>138.000000</td>\n",
+       "      <td>135.000000</td>\n",
+       "      <td>137.000000</td>\n",
+       "      <td>77.000000</td>\n",
+       "      <td>86.750000</td>\n",
+       "      <td>86.00000</td>\n",
+       "      <td>84.000000</td>\n",
+       "      <td>80.000000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>max</th>\n",
+       "      <td>244.000000</td>\n",
+       "      <td>247.000000</td>\n",
+       "      <td>144.000000</td>\n",
+       "      <td>273.000000</td>\n",
+       "      <td>132.00000</td>\n",
+       "      <td>174.000000</td>\n",
+       "      <td>234.000000</td>\n",
+       "      <td>284.000000</td>\n",
+       "      <td>123.000000</td>\n",
+       "      <td>112.000000</td>\n",
+       "      <td>120.00000</td>\n",
+       "      <td>108.000000</td>\n",
+       "      <td>99.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "component     blood pressure systolic                                         \\\n",
+       "status                          known                                          \n",
+       "variable_type                      qn                                          \n",
+       "units                            mmHg                                          \n",
+       "description                    220050        220179      224167       225309   \n",
+       "count                    15186.000000  21957.000000   12.000000  1251.000000   \n",
+       "mean                       118.988213    119.200483  104.416667   110.457234   \n",
+       "std                         23.366007     21.757748   15.559027    20.465707   \n",
+       "min                          0.000000     33.000000   86.000000    23.000000   \n",
+       "25%                        103.000000    104.000000   97.500000    99.000000   \n",
+       "50%                        117.000000    117.000000  102.000000   108.000000   \n",
+       "75%                        133.000000    133.000000  104.000000   120.000000   \n",
+       "max                        244.000000    247.000000  144.000000   273.000000   \n",
+       "\n",
+       "component                                                                      \\\n",
+       "status                                                                unknown   \n",
+       "variable_type                                                              qn   \n",
+       "units                                                                  cc/min   \n",
+       "description       227243         442           455            51         3313   \n",
+       "count            8.00000   17.000000  26478.000000  35616.000000  2241.000000   \n",
+       "mean           111.87500  122.882353    119.150623    121.264628    70.371709   \n",
+       "std             19.05209   31.262762     23.206573     25.927916    12.969975   \n",
+       "min             84.00000   70.000000      0.000000      0.000000    38.000000   \n",
+       "25%             97.25000   96.000000    102.000000    104.000000    61.000000   \n",
+       "50%            116.00000  125.000000    117.000000    119.000000    70.000000   \n",
+       "75%            128.50000  138.000000    135.000000    137.000000    77.000000   \n",
+       "max            132.00000  174.000000    234.000000    284.000000   123.000000   \n",
+       "\n",
+       "component                                                    \n",
+       "status                                                       \n",
+       "variable_type                                                \n",
+       "units                                                        \n",
+       "description          3315       3317        3321       3323  \n",
+       "count           22.000000   16.00000   13.000000  14.000000  \n",
+       "mean            77.727273   76.68750   77.846154  75.714286  \n",
+       "std             15.495566   17.72651   14.932326  14.514865  \n",
+       "min             54.000000   50.00000   58.000000  55.000000  \n",
+       "25%             66.250000   62.75000   67.000000  66.000000  \n",
+       "50%             76.000000   76.00000   75.000000  75.500000  \n",
+       "75%             86.750000   86.00000   84.000000  80.000000  \n",
+       "max            112.000000  120.00000  108.000000  99.000000  "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "((103300, 1), (97527, 13), 469L, 2, '0.2094% records')\n",
+      "(2017-06-20 10:04:19)<<<< DONE (5.0s)\n",
+      "(2017-06-20 10:04:19)<< DONE (62.0s)\n",
+      "(2017-06-20 10:04:19) DONE (70.0s)\n"
+     ]
+    }
+   ],
+   "source": [
+    "n = 100  # how many admissions do_ETL samples (it only skips sampling when n == constants.ALL)\n",
+    "hdf5_fname = do_ETL(data_dict, components=[data_dict.components.BLOOD_PRESSURE_SYSTOLIC], tag=tag, n=n)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 44,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-06-20 10:09:14) BEGIN ETL for all admissions\n",
+      "(2017-06-20 10:09:15)>> Extract CONTEXT...\n",
+      "(2017-06-20 10:09:27)<< DONE (12.0s)\n",
+      "(2017-06-20 10:09:27)>> BLOOD PRESSURE SYSTOLIC\n",
+      "(2017-06-20 10:09:27)>>>> Extracting...\n",
+      "(2017-06-20 10:09:28)>>>>>> Extracting 14 items from chartevents\n",
+      "51        2099353\n",
+      "455       1586769\n",
+      "220179    1290488\n",
+      "220050    1149788\n",
+      "3313       148105\n",
+      "225309      86557\n",
+      "3315         3762\n",
+      "442          2565\n",
+      "3317         2052\n",
+      "3323         2039\n",
+      "3321         2032\n",
+      "224167        740\n",
+      "227243        541\n",
+      "6              33\n",
+      "Name: itemid, dtype: int64\n",
+      "              id            datetime   value units  itemid\n",
+      "963709  136796.0 2139-10-06 21:00:00  113/55             6\n",
+      "963711  136796.0 2139-10-06 22:00:00  126/58             6\n",
+      "963713  136796.0 2139-10-06 23:00:00  139/64             6\n",
+      "964245  136796.0 2139-10-07 07:00:00  132/59             6\n",
+      "964247  136796.0 2139-10-07 08:00:00  143/63             6\n",
+      "964301  136796.0 2139-10-07 16:00:00  152/68             6\n",
+      "964304  136796.0 2139-10-07 18:00:00  141/59             6\n",
+      "964710  136796.0 2139-10-07 09:00:00  133/59             6\n",
+      "964743  136796.0 2139-10-07 10:00:00  131/60             6\n",
+      "965088  136796.0 2139-10-07 11:00:00  123/54             6\n",
+      "965090  136796.0 2139-10-07 12:00:00  185/79             6\n",
+      "965092  136796.0 2139-10-07 13:00:00  116/54             6\n",
+      "965094  136796.0 2139-10-07 14:00:00  122/57             6\n",
+      "965096  136796.0 2139-10-07 15:00:00  120/56             6\n",
+      "965438  136796.0 2139-10-06 13:00:00  122/55             6\n",
+      "965440  136796.0 2139-10-06 14:00:00  110/56             6\n",
+      "965854  136796.0 2139-10-06 18:00:00  108/56             6\n",
+      "965856  136796.0 2139-10-06 20:00:00  115/56             6\n",
+      "966407  136796.0 2139-10-07 03:00:00  129/57             6\n",
+      "966409  136796.0 2139-10-07 04:00:00  121/55             6\n",
+      "966411  136796.0 2139-10-07 05:00:00  125/56             6\n",
+      "968122  136796.0 2139-10-06 09:00:00  119/55             6\n",
+      "968125  136796.0 2139-10-06 12:00:00  113/60             6\n",
+      "968615  136796.0 2139-10-07 00:00:00  120/54             6\n",
+      "968617  136796.0 2139-10-07 01:00:00  130/58             6\n",
+      "968619  136796.0 2139-10-07 02:00:00  124/56             6\n"
+     ]
+    },
+    {
+     "ename": "KeyError",
+     "evalue": "0L",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[1;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
+      "\u001b[1;32m<ipython-input-44-88e79271be02>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[0mn\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mconstants\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mhdf5_fname\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdo_ETL\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_SYSTOLIC\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'bp'\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
+      "\u001b[1;32m<ipython-input-37-093e315c4cfe>\u001b[0m in \u001b[0;36mdo_ETL\u001b[1;34m(data_dict, components, tag, n, seed)\u001b[0m\n\u001b[0;32m      2\u001b[0m     \u001b[0mhdf5_fname\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'data/mimic_{}_{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mtag\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      3\u001b[0m     \u001b[0mhadm_ids\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mn\u001b[0m \u001b[1;32mif\u001b[0m \u001b[0mn\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mconstants\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mALL\u001b[0m \u001b[1;32melse\u001b[0m \u001b[0mmimic\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msample_hadm_ids\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mn\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mseed\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 4\u001b[1;33m     \u001b[0mmimic_ETL\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      5\u001b[0m     \u001b[1;32mreturn\u001b[0m \u001b[0mhdf5_fname\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32m<ipython-input-36-1619d6fa19c9>\u001b[0m in \u001b[0;36mmimic_ETL\u001b[1;34m(components, data_dict, hdf5_fname, hadm_ids, agg_func)\u001b[0m\n\u001b[0;32m     35\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     36\u001b[0m         \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mlog\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m\"Extracting...\"\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mnew_level\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 37\u001b[1;33m         \u001b[0mdf_extracted\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mextractor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     38\u001b[0m         \u001b[0mutils\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msave_df\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdf_extracted\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhdf5_fname\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'extracted/{}'\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mformat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     39\u001b[0m         \u001b[0mlogger\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mend_log_level\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.py\u001b[0m in \u001b[0;36mextract_component\u001b[1;34m(self, component, hadm_ids)\u001b[0m\n\u001b[0;32m     95\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     96\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mALL\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 97\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mextract_component\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mconn\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcomponent\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mitem_map\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mdata_dict\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mhadm_ids\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     98\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     99\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\icu_ml_project\\v5\\mimic.py\u001b[0m in \u001b[0;36mextract_component\u001b[1;34m(mimic_conn, component, item_map, data_dict, hadm_ids)\u001b[0m\n\u001b[0;32m    132\u001b[0m                 \u001b[1;32mif\u001b[0m \u001b[0mbp_slice\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m!=\u001b[0m \u001b[1;36m0\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    133\u001b[0m                     \u001b[1;32mif\u001b[0m \u001b[0mcomponent\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_SYSTOLIC\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 134\u001b[1;33m                         \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mis_item_6\u001b[0m \u001b[1;33m&\u001b[0m \u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mis_item_6\u001b[0m \u001b[1;33m&\u001b[0m \u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstr\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'/'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mastype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mint\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    135\u001b[0m                     \u001b[1;32melif\u001b[0m \u001b[0mcomponent\u001b[0m \u001b[1;33m==\u001b[0m 
\u001b[0mdata_dict\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcomponents\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mBLOOD_PRESSURE_DIASTOLIC\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    136\u001b[0m                         \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mdf\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mhas_slash\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;34m'value'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstr\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'/'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mastype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mint\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\core\\series.pyc\u001b[0m in \u001b[0;36m__getitem__\u001b[1;34m(self, key)\u001b[0m\n\u001b[0;32m    599\u001b[0m         \u001b[0mkey\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mcom\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0m_apply_if_callable\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    600\u001b[0m         \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 601\u001b[1;33m             \u001b[0mresult\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget_value\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    602\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    603\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[1;32mnot\u001b[0m \u001b[0mis_scalar\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresult\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mC:\\Users\\genkinjz\\AppData\\Local\\Continuum\\Anaconda2\\lib\\site-packages\\pandas\\indexes\\base.pyc\u001b[0m in \u001b[0;36mget_value\u001b[1;34m(self, series, key)\u001b[0m\n\u001b[0;32m   2137\u001b[0m         \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2138\u001b[0m             return self._engine.get_value(s, k,\n\u001b[1;32m-> 2139\u001b[1;33m                                           tz=getattr(series.dtype, 'tz', None))\n\u001b[0m\u001b[0;32m   2140\u001b[0m         \u001b[1;32mexcept\u001b[0m \u001b[0mKeyError\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0me1\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m   2141\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[0mlen\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;33m>\u001b[0m \u001b[1;36m0\u001b[0m \u001b[1;32mand\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0minferred_type\u001b[0m \u001b[1;32min\u001b[0m \u001b[1;33m[\u001b[0m\u001b[1;34m'integer'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;34m'boolean'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
+      "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_value (pandas\\index.c:3338)\u001b[1;34m()\u001b[0m\n",
+      "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_value (pandas\\index.c:3041)\u001b[1;34m()\u001b[0m\n",
+      "\u001b[1;32mpandas\\index.pyx\u001b[0m in \u001b[0;36mpandas.index.IndexEngine.get_loc (pandas\\index.c:4024)\u001b[1;34m()\u001b[0m\n",
+      "\u001b[1;32mpandas\\src\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas.hashtable.Int64HashTable.get_item (pandas\\hashtable.c:8141)\u001b[1;34m()\u001b[0m\n",
+      "\u001b[1;32mpandas\\src\\hashtable_class_helper.pxi\u001b[0m in \u001b[0;36mpandas.hashtable.Int64HashTable.get_item (pandas\\hashtable.c:8085)\u001b[1;34m()\u001b[0m\n",
+      "\u001b[1;31mKeyError\u001b[0m: 0L"
+     ]
+    }
+   ],
+   "source": [
+    "n = constants.ALL  # sentinel: do_ETL passes it through as hadm_ids instead of drawing a sample\n",
+    "hdf5_fname = do_ETL(data_dict, components=[data_dict.components.BLOOD_PRESSURE_SYSTOLIC], tag='bp', n=n)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 35,
+   "metadata": {
+    "collapsed": false,
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<class 'pandas.io.pytables.HDFStore'>\n",
+       "File path: data/mimic_simple_all\n",
+       "/cleaned/blood pressure diastolic                        frame                            \n",
+       "/cleaned/blood pressure mean                             frame                            \n",
+       "/cleaned/blood pressure systolic                         frame                            \n",
+       "/cleaned/glasgow coma scale eye opening                  frame                            \n",
+       "/cleaned/glasgow coma scale motor                        frame                            \n",
+       "/cleaned/glasgow coma scale verbal                       frame                            \n",
+       "/cleaned/heart rate                                      frame                            \n",
+       "/cleaned/hemoglobin                                      frame                            \n",
+       "/cleaned/lactate                                         frame                            \n",
+       "/cleaned/lactated ringers                                frame                            \n",
+       "/cleaned/norepinephrine                                  frame                            \n",
+       "/cleaned/normal saline                                   frame                            \n",
+       "/cleaned/output urine                                    frame                            \n",
+       "/cleaned/oxygen saturation pulse oximetry                frame                            \n",
+       "/cleaned/respiratory rate                                frame                            \n",
+       "/cleaned/temperature body                                frame                            \n",
+       "/cleaned/vasopressin                                     frame                            \n",
+       "/cleaned/weight body                                     frame                            \n",
+       "/context                                                 frame        (shape->[62722,22]) \n",
+       "/extracted/blood pressure diastolic                      frame        (shape->[6371249,5])\n",
+       "/extracted/blood pressure mean                           frame        (shape->[2536271,5])\n",
+       "/extracted/blood pressure systolic                       frame        (shape->[6374824,5])\n",
+       "/extracted/glasgow coma scale eye opening                frame        (shape->[956672,5]) \n",
+       "/extracted/glasgow coma scale motor                      frame        (shape->[952565,5]) \n",
+       "/extracted/glasgow coma scale verbal                     frame        (shape->[954700,5]) \n",
+       "/extracted/heart rate                                    frame        (shape->[7952939,5])\n",
+       "/extracted/hemoglobin                                    frame        (shape->[1167921,5])\n",
+       "/extracted/lactate                                       frame        (shape->[393608,5]) \n",
+       "/extracted/lactated ringers                              frame        (shape->[504306,5]) \n",
+       "/extracted/norepinephrine                                frame        (shape->[1136938,5])\n",
+       "/extracted/normal saline                                 frame        (shape->[817373,5]) \n",
+       "/extracted/output urine                                  frame        (shape->[3644639,5])\n",
+       "/extracted/oxygen saturation pulse oximetry              frame        (shape->[6099827,5])\n",
+       "/extracted/respiratory rate                              frame        (shape->[7810019,5])\n",
+       "/extracted/temperature body                              frame        (shape->[1751447,5])\n",
+       "/extracted/vasopressin                                   frame        (shape->[339184,5]) \n",
+       "/extracted/weight body                                   frame        (shape->[95425,5])  \n",
+       "/transformed/blood pressure diastolic                    frame                            \n",
+       "/transformed/blood pressure mean                         frame                            \n",
+       "/transformed/blood pressure systolic                     frame                            \n",
+       "/transformed/glasgow coma scale eye opening              frame                            \n",
+       "/transformed/glasgow coma scale motor                    frame                            \n",
+       "/transformed/glasgow coma scale verbal                   frame                            \n",
+       "/transformed/heart rate                                  frame                            \n",
+       "/transformed/hemoglobin                                  frame                            \n",
+       "/transformed/lactate                                     frame                            \n",
+       "/transformed/lactated ringers                            frame                            \n",
+       "/transformed/norepinephrine                              frame                            \n",
+       "/transformed/normal saline                               frame                            \n",
+       "/transformed/output urine                                frame                            \n",
+       "/transformed/oxygen saturation pulse oximetry            frame                            \n",
+       "/transformed/respiratory rate                            frame                            \n",
+       "/transformed/temperature body                            frame                            \n",
+       "/transformed/vasopressin                                 frame                            \n",
+       "/transformed/weight body                                 frame                            "
+      ]
+     },
+     "execution_count": 35,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "store = pd.HDFStore(hdf5_fname)\n",
+    "store"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 36,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "store.close()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import utils\n",
+    "import mimic\n",
+    "import icu_data_defs\n",
+    "import transformers"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')\n",
+    "components = data_dict.get_panel_defintions(1).component.unique().tolist() #1 is vitals"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[u'heart rate',\n",
+       " u'blood pressure systolic',\n",
+       " u'blood pressure diastolic',\n",
+       " u'blood pressure mean',\n",
+       " u'respiratory rate',\n",
+       " u'temperature body',\n",
+       " u'oxygen saturation pulse oximetry',\n",
+       " u'weight body']"
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "components"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(2017-07-04 22:28:15)<<<<<<<< --- (25.0s)\n",
+      "(2017-07-04 22:28:15)>>>>>>>> ***ETL***\n",
+      "(2017-07-04 22:28:15)>>>>>>>>>> SETUP\n",
+      "(2017-07-04 22:28:15)<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:28:15)>>>>>>>>>> BEGIN ETL for all admissions and 8 components: [u'heart rate', u'blood pressure systolic', u'blood pressure diastolic', u'blood pressure mean', u'respiratory rate', u'temperature body', u'oxygen saturation pulse oximetry', u'weight body']\n",
+      "(2017-07-04 22:28:15)>>>>>>>>>>>> HEART RATE: 1/8\n",
+      "(2017-07-04 22:28:15)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 22:28:16)>>>>>>>>>>>>>>>> Extracting 5 items from chartevents\n",
+      "(2017-07-04 22:29:12)<<<<<<<<<<<<<<<< --- (56.0s)\n",
+      "(2017-07-04 22:29:12)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 22:29:13)<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:29:13)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 22:29:33)<<<<<<<<<<<<<<<< --- (20.0s)\n",
+      "(2017-07-04 22:29:33)<<<<<<<<<<<<<< --- (78.0s)\n",
+      "(2017-07-04 22:29:33)>>>>>>>>>>>>>> Transforming... (7952939, 5)\n",
+      "Data Loss (Extract > Transformed): ((7952939, 1), (7923711, 6), 29066L, 171, '0.3015% records')\n",
+      "(2017-07-04 22:31:25)<<<<<<<<<<<<<< --- (112.0s)\n",
+      "(2017-07-04 22:31:25)>>>>>>>>>>>>>> Cleaning... (7923711, 6)\n",
+      "(2017-07-04 22:32:14)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 22:32:14)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:32:14)>>>>>>>>>>>>>>>> Drop OOB data | (7922986, 6)\n",
+      "(2017-07-04 22:32:18)>>>>>>>>>>>>>>>>>> heart rate, beats/min, 7923117\n",
+      "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<<<< --- (71.0s)\n",
+      "(2017-07-04 22:33:29)>>>>>>>>>>>>>>>>>> heart rate, no_units, 31\n",
+      "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:33:29)<<<<<<<<<<<<<<<< --- (75.0s)\n",
+      "Data Loss (Extract > Cleaned): ((7952939, 1), (7922986, 6), 29804L, 171, '0.3015% records')\n",
+      "(2017-07-04 22:33:31)<<<<<<<<<<<<<< --- (126.0s)\n",
+      "(2017-07-04 22:33:31)>>>>>>>>>>>>>> Filter & sort - (7922986, 6)\n",
+      "(2017-07-04 22:33:35)<<<<<<<<<<<<<< --- (4.0s)\n",
+      "(2017-07-04 22:33:35)>>>>>>>>>>>>>> Convert to dask - (7922986, 6)\n",
+      "(2017-07-04 22:33:36)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:33:36)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 22:33:36)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:33:36)<<<<<<<<<<<< --- (321.0s)\n",
+      "(2017-07-04 22:33:36)>>>>>>>>>>>> BLOOD PRESSURE SYSTOLIC: 2/8\n",
+      "(2017-07-04 22:33:36)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 22:33:36)>>>>>>>>>>>>>>>> Extracting 14 items from chartevents\n",
+      "(2017-07-04 22:35:06)<<<<<<<<<<<<<<<< --- (90.0s)\n",
+      "(2017-07-04 22:35:06)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 22:35:06)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:35:06)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 22:35:10)<<<<<<<<<<<<<<<< --- (4.0s)\n",
+      "(2017-07-04 22:35:10)<<<<<<<<<<<<<< --- (94.0s)\n",
+      "(2017-07-04 22:35:10)>>>>>>>>>>>>>> Transforming... (6374824, 5)\n",
+      "Data Loss (Extract > Transformed): ((6374824, 1), (5974719, 15), 43236L, 174, '0.307% records')\n",
+      "(2017-07-04 22:36:52)<<<<<<<<<<<<<< --- (102.0s)\n",
+      "(2017-07-04 22:36:52)>>>>>>>>>>>>>> Cleaning... (5974719, 15)\n",
+      "(2017-07-04 22:42:30)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 22:42:31)<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:42:31)>>>>>>>>>>>>>>>> Drop OOB data | (5974186, 14)\n",
+      "(2017-07-04 22:42:34)>>>>>>>>>>>>>>>>>> blood pressure systolic, mmHg, 6177439\n",
+      "(2017-07-04 22:45:18)<<<<<<<<<<<<<<<<<< --- (164.0s)\n",
+      "(2017-07-04 22:45:18)>>>>>>>>>>>>>>>>>> blood pressure systolic, cc/min, 153573\n",
+      "(2017-07-04 22:45:19)<<<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:45:19)<<<<<<<<<<<<<<<< --- (168.0s)\n",
+      "Data Loss (Extract > Cleaned): ((6374824, 1), (5974186, 14), 43848L, 174, '0.307% records')\n",
+      "(2017-07-04 22:45:20)<<<<<<<<<<<<<< --- (508.0s)\n",
+      "(2017-07-04 22:45:20)>>>>>>>>>>>>>> Filter & sort - (5974186, 14)\n",
+      "(2017-07-04 22:45:23)<<<<<<<<<<<<<< --- (3.0s)\n",
+      "(2017-07-04 22:45:23)>>>>>>>>>>>>>> Convert to dask - (5974186, 14)\n",
+      "(2017-07-04 22:45:25)<<<<<<<<<<<<<< --- (2.0s)\n",
+      "(2017-07-04 22:45:25)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 22:45:25)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:45:25)<<<<<<<<<<<< --- (709.0s)\n",
+      "(2017-07-04 22:45:25)>>>>>>>>>>>> BLOOD PRESSURE DIASTOLIC: 3/8\n",
+      "(2017-07-04 22:45:25)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 22:45:25)>>>>>>>>>>>>>>>> Extracting 16 items from chartevents\n",
+      "(2017-07-04 22:48:00)<<<<<<<<<<<<<<<< --- (155.0s)\n",
+      "(2017-07-04 22:48:00)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 22:48:00)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:48:00)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 22:48:06)<<<<<<<<<<<<<<<< --- (6.0s)\n",
+      "(2017-07-04 22:48:06)<<<<<<<<<<<<<< --- (161.0s)\n",
+      "(2017-07-04 22:48:06)>>>>>>>>>>>>>> Transforming... (6371282, 5)\n",
+      "Data Loss (Extract > Transformed): ((6371282, 1), (5976845, 17), 24410L, 170, '0.2999% records')\n",
+      "(2017-07-04 22:49:52)<<<<<<<<<<<<<< --- (106.0s)\n",
+      "(2017-07-04 22:49:52)>>>>>>>>>>>>>> Cleaning... (5976845, 17)\n",
+      "(2017-07-04 22:56:05)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 22:56:06)<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:56:06)>>>>>>>>>>>>>>>> Drop OOB data | (5976313, 16)\n",
+      "(2017-07-04 22:56:10)>>>>>>>>>>>>>>>>>> blood pressure diastolic, mmHg, 6194656\n",
+      "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<<<< --- (209.0s)\n",
+      "(2017-07-04 22:59:39)>>>>>>>>>>>>>>>>>> blood pressure diastolic, cc/min, 151640\n",
+      "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:59:39)<<<<<<<<<<<<<<<< --- (213.0s)\n",
+      "Data Loss (Extract > Cleaned): ((6371282, 1), (5976313, 16), 25238L, 170, '0.2999% records')\n",
+      "(2017-07-04 22:59:41)<<<<<<<<<<<<<< --- (589.0s)\n",
+      "(2017-07-04 22:59:41)>>>>>>>>>>>>>> Filter & sort - (5976313, 16)\n",
+      "(2017-07-04 22:59:45)<<<<<<<<<<<<<< --- (4.0s)\n",
+      "(2017-07-04 22:59:45)>>>>>>>>>>>>>> Convert to dask - (5976313, 16)\n",
+      "(2017-07-04 22:59:46)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 22:59:46)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 22:59:46)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 22:59:46)<<<<<<<<<<<< --- (861.0s)\n",
+      "(2017-07-04 22:59:46)>>>>>>>>>>>> BLOOD PRESSURE MEAN: 4/8\n",
+      "(2017-07-04 22:59:46)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 22:59:46)>>>>>>>>>>>>>>>> Extracting 3 items from chartevents\n",
+      "(2017-07-04 23:00:18)<<<<<<<<<<<<<<<< --- (32.0s)\n",
+      "(2017-07-04 23:00:18)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 23:00:19)<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:00:19)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 23:00:20)<<<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:00:20)<<<<<<<<<<<<<< --- (34.0s)\n",
+      "(2017-07-04 23:00:20)>>>>>>>>>>>>>> Transforming... (2536271, 5)\n",
+      "Data Loss (Extract > Transformed): ((2536271, 1), (2416029, 3), 0L, 0, '0.0% records')\n",
+      "(2017-07-04 23:01:04)<<<<<<<<<<<<<< --- (44.0s)\n",
+      "(2017-07-04 23:01:04)>>>>>>>>>>>>>> Cleaning... (2416029, 3)\n",
+      "(2017-07-04 23:01:19)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 23:01:19)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:01:19)>>>>>>>>>>>>>>>> Drop OOB data | (2415995, 3)\n",
+      "(2017-07-04 23:01:20)>>>>>>>>>>>>>>>>>> blood pressure mean, mmHg, 2536236\n",
+      "(2017-07-04 23:01:55)<<<<<<<<<<<<<<<<<< --- (35.0s)\n",
+      "(2017-07-04 23:01:55)<<<<<<<<<<<<<<<< --- (36.0s)\n",
+      "Data Loss (Extract > Cleaned): ((2536271, 1), (2415995, 3), 1873L, 0, '0.0% records')\n",
+      "(2017-07-04 23:01:55)<<<<<<<<<<<<<< --- (51.0s)\n",
+      "(2017-07-04 23:01:55)>>>>>>>>>>>>>> Filter & sort - (2415995, 3)\n",
+      "(2017-07-04 23:01:56)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:01:56)>>>>>>>>>>>>>> Convert to dask - (2415995, 3)\n",
+      "(2017-07-04 23:01:57)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:01:57)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 23:01:57)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:01:57)<<<<<<<<<<<< --- (131.0s)\n",
+      "(2017-07-04 23:01:57)>>>>>>>>>>>> RESPIRATORY RATE: 5/8\n",
+      "(2017-07-04 23:01:57)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 23:01:57)>>>>>>>>>>>>>>>> Extracting 4 items from chartevents\n",
+      "(2017-07-04 23:06:09)<<<<<<<<<<<<<<<< --- (252.0s)\n",
+      "(2017-07-04 23:06:09)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 23:06:09)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:06:09)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 23:06:24)<<<<<<<<<<<<<<<< --- (15.0s)\n",
+      "(2017-07-04 23:06:24)<<<<<<<<<<<<<< --- (267.0s)\n",
+      "(2017-07-04 23:06:24)>>>>>>>>>>>>>> Transforming... (7810019, 5)\n",
+      "Data Loss (Extract > Transformed): ((7810019, 1), (7780717, 5), 28707L, 172, '0.3035% records')\n",
+      "(2017-07-04 23:08:13)<<<<<<<<<<<<<< --- (109.0s)\n",
+      "(2017-07-04 23:08:13)>>>>>>>>>>>>>> Cleaning... (7780717, 5)\n",
+      "(2017-07-04 23:11:07)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 23:11:07)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:11:07)>>>>>>>>>>>>>>>> Drop OOB data | (7780015, 4)\n",
+      "(2017-07-04 23:11:11)>>>>>>>>>>>>>>>>>> respiratory rate, insp/min, 6108262\n",
+      "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (57.0s)\n",
+      "(2017-07-04 23:12:08)>>>>>>>>>>>>>>>>>> respiratory rate, Breath, 1671901\n",
+      "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:12:08)>>>>>>>>>>>>>>>>>> respiratory rate, no_units, 2\n",
+      "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:12:08)<<<<<<<<<<<<<<<< --- (61.0s)\n",
+      "Data Loss (Extract > Cleaned): ((7810019, 1), (7780015, 4), 29907L, 172, '0.3035% records')\n",
+      "(2017-07-04 23:12:09)<<<<<<<<<<<<<< --- (236.0s)\n",
+      "(2017-07-04 23:12:10)>>>>>>>>>>>>>> Filter & sort - (7780015, 4)\n",
+      "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (4.0s)\n",
+      "(2017-07-04 23:12:14)>>>>>>>>>>>>>> Convert to dask - (7780015, 4)\n",
+      "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:12:14)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 23:12:14)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:12:14)<<<<<<<<<<<< --- (617.0s)\n",
+      "(2017-07-04 23:12:14)>>>>>>>>>>>> TEMPERATURE BODY: 6/8\n",
+      "(2017-07-04 23:12:15)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 23:12:15)>>>>>>>>>>>>>>>> Extracting 4 items from chartevents\n",
+      "(2017-07-04 23:13:06)<<<<<<<<<<<<<<<< --- (51.0s)\n",
+      "(2017-07-04 23:13:06)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 23:13:06)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:13:06)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 23:13:11)<<<<<<<<<<<<<<<< --- (5.0s)\n",
+      "(2017-07-04 23:13:11)<<<<<<<<<<<<<< --- (56.0s)\n",
+      "(2017-07-04 23:13:11)>>>>>>>>>>>>>> Transforming... (1751447, 5)\n",
+      "Data Loss (Extract > Transformed): ((1751447, 1), (1731875, 4), 16612L, 156, '0.3189% records')\n",
+      "(2017-07-04 23:13:42)<<<<<<<<<<<<<< --- (31.0s)\n",
+      "(2017-07-04 23:13:42)>>>>>>>>>>>>>> Cleaning... (1731875, 4)\n",
+      "(2017-07-04 23:13:54)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 23:13:54)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:13:54)>>>>>>>>>>>>>>>> Drop OOB data | (1731794, 4)\n",
+      "(2017-07-04 23:13:55)>>>>>>>>>>>>>>>>>> temperature body, degF, 1734754\n",
+      "(2017-07-04 23:14:24)<<<<<<<<<<<<<<<<<< --- (29.0s)\n",
+      "(2017-07-04 23:14:24)<<<<<<<<<<<<<<<< --- (30.0s)\n",
+      "Data Loss (Extract > Cleaned): ((1751447, 1), (1731794, 4), 17226L, 156, '0.3189% records')\n",
+      "(2017-07-04 23:14:24)<<<<<<<<<<<<<< --- (42.0s)\n",
+      "(2017-07-04 23:14:24)>>>>>>>>>>>>>> Filter & sort - (1731794, 4)\n",
+      "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Convert to dask - (1731794, 4)\n",
+      "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 23:14:25)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:14:25)<<<<<<<<<<<< --- (131.0s)\n",
+      "(2017-07-04 23:14:25)>>>>>>>>>>>> OXYGEN SATURATION PULSE OXIMETRY: 7/8\n",
+      "(2017-07-04 23:14:25)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 23:14:25)>>>>>>>>>>>>>>>> Extracting 2 items from chartevents\n",
+      "(2017-07-04 23:15:41)<<<<<<<<<<<<<<<< --- (76.0s)\n",
+      "(2017-07-04 23:15:41)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 23:15:41)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:15:41)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 23:15:58)<<<<<<<<<<<<<<<< --- (17.0s)\n",
+      "(2017-07-04 23:15:58)<<<<<<<<<<<<<< --- (93.0s)\n",
+      "(2017-07-04 23:15:58)>>>>>>>>>>>>>> Transforming... (6099827, 5)\n",
+      "Data Loss (Extract > Transformed): ((6099827, 1), (6073540, 2), 26134L, 163, '0.3326% records')\n",
+      "(2017-07-04 23:17:28)<<<<<<<<<<<<<< --- (90.0s)\n",
+      "(2017-07-04 23:17:28)>>>>>>>>>>>>>> Cleaning... (6073540, 2)\n",
+      "(2017-07-04 23:18:01)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 23:18:01)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:18:01)>>>>>>>>>>>>>>>> Drop OOB data | (6073019, 2)\n",
+      "(2017-07-04 23:18:03)>>>>>>>>>>>>>>>>>> oxygen saturation pulse oximetry, percent, 6073172\n",
+      "(2017-07-04 23:18:54)<<<<<<<<<<<<<<<<<< --- (51.0s)\n",
+      "(2017-07-04 23:18:54)<<<<<<<<<<<<<<<< --- (53.0s)\n",
+      "Data Loss (Extract > Cleaned): ((6099827, 1), (6073019, 2), 26707L, 163, '0.3326% records')\n",
+      "(2017-07-04 23:18:55)<<<<<<<<<<<<<< --- (87.0s)\n",
+      "(2017-07-04 23:18:56)>>>>>>>>>>>>>> Filter & sort - (6073019, 2)\n",
+      "(2017-07-04 23:18:58)<<<<<<<<<<<<<< --- (2.0s)\n",
+      "(2017-07-04 23:18:58)>>>>>>>>>>>>>> Convert to dask - (6073019, 2)\n",
+      "(2017-07-04 23:18:59)<<<<<<<<<<<<<< --- (1.0s)\n",
+      "(2017-07-04 23:18:59)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 23:18:59)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:18:59)<<<<<<<<<<<< --- (274.0s)\n",
+      "(2017-07-04 23:18:59)>>>>>>>>>>>> WEIGHT BODY: 8/8\n",
+      "(2017-07-04 23:18:59)>>>>>>>>>>>>>> Extracting...\n",
+      "(2017-07-04 23:18:59)>>>>>>>>>>>>>>>> Extracting 3 items from chartevents\n",
+      "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (35.0s)\n",
+      "(2017-07-04 23:19:34)>>>>>>>>>>>>>>>> Combine DF\n",
+      "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:34)>>>>>>>>>>>>>>>> Clean UOM\n",
+      "(2017-07-04 23:19:34)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:34)<<<<<<<<<<<<<< --- (35.0s)\n",
+      "(2017-07-04 23:19:34)>>>>>>>>>>>>>> Transforming... (95425, 5)\n",
+      "Data Loss (Extract > Transformed): ((95425, 1), (94484, 3), 941L, 158, '0.4958% records')\n",
+      "(2017-07-04 23:19:36)<<<<<<<<<<<<<< --- (2.0s)\n",
+      "(2017-07-04 23:19:36)>>>>>>>>>>>>>> Cleaning... (94484, 3)\n",
+      "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>> Nominal to OneHot\n",
+      "(2017-07-04 23:19:37)<<<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>> Drop OOB data | (94457, 3)\n",
+      "(2017-07-04 23:19:37)>>>>>>>>>>>>>>>>>> weight body, kg, 94457\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<<<<<< --- (5.0s)\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<<<< --- (5.0s)\n",
+      "Data Loss (Extract > Cleaned): ((95425, 1), (94457, 3), 979L, 158, '0.4958% records')\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (6.0s)\n",
+      "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Filter & sort - (94457, 3)\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Convert to dask - (94457, 3)\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:42)>>>>>>>>>>>>>> Join to big DF\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<<<< --- (0.0s)\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<<<< --- (43.0s)\n",
+      "(2017-07-04 23:19:42)<<<<<<<<<< --- (3087.0s)\n",
+      "(2017-07-04 23:19:42)<<<<<<<< --- (3087.0s)\n"
+     ]
+    }
+   ],
+   "source": [
+    "df_all = mimic.ETL(mimic.mimic_extractor('config/mimic_item_map.csv',data_dict),\n",
+    "                   components,\n",
+    "                   data_dict,\n",
+    "                   transformers.same_index_aggregator(agg_func=lambda x:x.iloc[0]))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Get all of the data we want and join into a single DF"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import utils\n",
+    "import logger\n",
+    "import transformers\n",
+    "import warnings\n",
+    "warnings.filterwarnings('ignore')\n",
+    "\n",
+    "def get_big_df(hdf5_fname,components):\n",
+    "    '''Load every cleaned component from the HDF5 store and outer-join them into one DataFrame.\n",
+    "\n",
+    "    hdf5_fname -- path of the HDF5 store, handed to utils.open_df\n",
+    "    components -- list of component names; each one is read from the key 'cleaned/<component>'\n",
+    "\n",
+    "    Each frame is sorted on both axes, passed through\n",
+    "    transformers.remove_small_columns(threshold=5) and outer-joined onto the running result.\n",
+    "    Summary statistics and the data-loss report are displayed for every component.\n",
+    "\n",
+    "    Returns the joined DataFrame, or None when components is empty.\n",
+    "    '''\n",
+    "    df_all = None\n",
+    "    n_components = len(components)\n",
+    "    logger.log('Make DF for {} components...\\n{}'.format(n_components,'\\n'.join(components)),new_level=True)\n",
+    "    # enumerate yields the progress position directly; components.index() rescanned the list on\n",
+    "    # every iteration and reported the wrong position for a repeated component name\n",
+    "    for position,component in enumerate(components,1):\n",
+    "        logger.log('{}: {}/{}'.format(component.upper(),position,n_components),new_level=True)\n",
+    "\n",
+    "        logger.log('Opening...')\n",
+    "        df = utils.open_df(hdf5_fname,'cleaned/{}'.format(component)).sort_index(axis=1).sort_index()\n",
+    "        display(df.describe(include='all'))\n",
+    "\n",
+    "        df_cleaned = transformers.remove_small_columns(threshold=5).fit_transform(df)\n",
+    "\n",
+    "        display(df_cleaned.describe(include='all'))\n",
+    "\n",
+    "        # call form prints the same value as the Python 2 print statement for a single argument\n",
+    "        print(utils.data_loss(df,df_cleaned))\n",
+    "\n",
+    "        logger.log('Join {} to {}'.format(df_cleaned.shape, None if df_all is None else df_all.shape))\n",
+    "        if df_all is None:\n",
+    "            df_all = df_cleaned\n",
+    "        else:\n",
+    "            df_all = df_all.join(df_cleaned,how='outer')\n",
+    "        # release the per-component names on every iteration (previously skipped for the first\n",
+    "        # component) so the raw frame is not kept alive while the next one is loaded\n",
+    "        del df,df_cleaned\n",
+    "\n",
+    "        logger.end_log_level()\n",
+    "    logger.end_log()\n",
+    "\n",
+    "    return df_all"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import icu_data_defs\n",
+    "data_dict = icu_data_defs.data_dictionary('config/data_definitions.xlsx')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "components = data_dict.get_panel_defintions(12).component.unique().tolist()\n",
+    "components"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "#everything up to urine output\n",
+    "df1 = get_big_df('data/mimic_data',components[:8])\n",
+    "utils.save_df(df1,'data/mimic_data','cleaned/part1')\n",
+    "\n",
+    "#urine output and forward\n",
+    "df2 = get_big_df('data/mimic_data',components[8:])\n",
+    "utils.save_df(df2,'data/mimic_data','cleaned/part2')\n",
+    "\n",
+    "df_combined = df1.join(df2,how='outer')\n",
+    "\n",
+    "del df1,df2\n",
+    "# show the shape of the frame built in this cell (df_all is a leftover from the ETL cell)\n",
+    "df_combined.shape"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "utils.save_df(df_combined,'data/mimic_data','cleaned/all')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Start here"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 70,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "\n",
+    "\n",
+    "def summable_filter(df):\n",
+    "    '''Return only the columns of df whose units are a volume or a mass, excluding body weight.\n",
+    "\n",
+    "    Column labels are indexed positionally: element 0 is compared with\n",
+    "    data_dict.labels.WEIGHT_BODY and element -2 is passed (as a string) to the unit registry checks.\n",
+    "    '''\n",
+    "    registry = units.MedicalUreg()\n",
+    "\n",
+    "    def keep_column(col_key):\n",
+    "        unit_name = str(col_key[-2])\n",
+    "        measurable = registry.is_volume(unit_name) or registry.is_mass(unit_name)\n",
+    "        if not measurable:\n",
+    "            return measurable\n",
+    "        return col_key[0] != data_dict.labels.WEIGHT_BODY\n",
+    "\n",
+    "    column_mask = df.columns.map(keep_column)\n",
+    "    return df.loc[:,column_mask]\n",
+    "\n",
+    "def lactate_filter_admissions(hdf5_fname):\n",
+    "    '''Unimplemented placeholder: the notebook only declared this signature.'''\n",
+    "    # The bare signature (no colon, no body) made the whole cell a SyntaxError;\n",
+    "    # fail loudly until the admission filter is actually written.\n",
+    "    raise NotImplementedError('lactate_filter_admissions is not implemented yet')\n",
+    "\n",
+    "def make_lactate_labels(hdf5_fname,custom_cleaners,data_dict):\n",
+    "    '''Build one lactate row per ID from the cleaned lactate frame.\n",
+    "\n",
+    "    hdf5_fname      -- path of the HDF5 store, handed to utils.open_df\n",
+    "    custom_cleaners -- object whose transform() is applied to the raw lactate frame\n",
+    "    data_dict       -- data dictionary; data_dict.labels.LACTATE names the component to open\n",
+    "\n",
+    "    Returns the cleaned frame (after transformers.max_col_only) grouped on the\n",
+    "    constants.column_names.ID index level and reduced to one row per group.\n",
+    "    '''\n",
+    "    df = utils.open_df(hdf5_fname,'cleaned/{}'.format(data_dict.labels.LACTATE))\n",
+    "    df_cleaned = custom_cleaners.transform(df)\n",
+    "    max_col_cleaner = transformers.max_col_only()\n",
+    "    df_cleaned = max_col_cleaner.transform(df_cleaned)\n",
+    "    # NOTE(review): the original read x.iloc[] (a SyntaxError) and discarded the result.\n",
+    "    # Index 0 (first row of each group) mirrors the agg_func used in the ETL cell - confirm\n",
+    "    # whether the first or the last lactate value per ID is the intended label.\n",
+    "    return df_cleaned.groupby(level=constants.column_names.ID).agg(lambda x: x.iloc[0])\n",
+    "    \n",
+    "    \n",
+    "\n",
+    "basic_feature_tuples = [\n",
+    "    ('MEAN',features.segment_mean(),constants.ALL),\n",
+    "    ('STD',features.segment_std(),constants.ALL),\n",
+    "    ('COUNT',features.segment_count(),constants.ALL),\n",
+    "    ('LAST',features.segment_last(),constants.ALL),\n",
+    "    ('SUM',features.segment_sum(),{constants.CUSTOM_FILTER:summable_filter})\n",
+    "]\n",
+    "\n",
+    "custom_cleaners = Pipeline([\n",
+    "        ('drop_oob_values',transformers.oob_value_remover(data_dict)),\n",
+    "        ('drop_small_columns',transformers.remove_small_columns(threshold=50)),\n",
+    "        ('combine_like_columns',transformers.combine_like_cols()),\n",
+    "#         ('quantitative_only',transformers.filter_var_type(var_types_to_keep)),\n",
+    "#         ('known_col_only',transformers.known_col_only()),\n",
+    "    ])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "\n",
+    "\n",
+    "# make_lactate_labels requires data_dict as its third positional argument\n",
+    "lactate_labels = make_lactate_labels(hdf5_fname,custom_cleaners,data_dict)\n",
+    "\n",
+    "# NOTE(review): `labels` is not assigned in the nearby cells - confirm whether lactate_labels was intended\n",
+    "df_features = mimic_features(hdf5_fname,'basic_all_before',labels,custom_cleaners)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "anaconda-cloud": {},
+  "kernelspec": {
+   "display_name": "Python [Root]",
+   "language": "python",
+   "name": "Python [Root]"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}