Switch to unified view

a b/Structural Health monitoring.ipynb
1
{
2
 "cells": [
3
  {
4
   "cell_type": "code",
5
   "execution_count": 1,
6
   "id": "b9ff0033",
7
   "metadata": {
8
    "scrolled": true
9
   },
10
   "outputs": [],
11
   "source": [
12
    "import os\n",
13
    "import scipy.io\n",
14
    "import pandas as pd\n",
15
    "import numpy as np\n",
16
    "import seaborn as sns\n",
17
    "import matplotlib.pyplot as plt\n",
18
    "#list of files for october, sorted because os.listdir returns entries in arbitrary order\n",
19
    "arr = sorted(os.listdir('./traindata_201910'))\n",
20
    "#list of files for April, sorted for the same reason\n",
21
    "arr2 = sorted(os.listdir('./traindata_201904'))"
22
   ]
23
  },
24
  {
25
   "cell_type": "code",
26
   "execution_count": 13,
27
   "id": "98d246d3",
28
   "metadata": {},
29
   "outputs": [],
30
   "source": [
31
    "\n",
32
    "#looping to include all data in october month\n",
33
    "\n",
34
    "for j in range(len(arr)):\n",
35
    "    strain = []\n",
36
    "    time = []\n",
37
    "    mat = scipy.io.loadmat('./traindata_201910/'+arr[j])\n",
38
    "    for item in mat['predat_sg'][0][0][3]:\n",
39
    "        strain.append(item)\n",
40
    "    for item in mat['predat_sg'][0][0][0]:\n",
41
    "        #convert MATLAB datenum (days) to a calendar date; 719529 shifts it to days since 1970-01-01\n",
42
    "        time.append(pd.to_datetime(item-719529,unit='d').round('s')[0].date())\n",
43
    "    if j==0:\n",
44
    "        col_name = []\n",
45
    "        for i in range (1,17):\n",
46
    "            col_name.append(\"strain_\"+str(i))\n",
47
    "\n",
48
    "        #create dataframe of the strain values, averaged per date (index = timestamp)\n",
49
    "        strain_oct = pd.DataFrame(strain, columns=col_name)\n",
50
    "        strain_oct.insert(0, 'timestamp', time)\n",
51
    "        strain_oct = strain_oct.groupby(['timestamp']).mean()\n",
52
    "    else:\n",
53
    "        temp = pd.DataFrame(strain, columns=col_name)\n",
54
    "        temp.insert(0,'timestamp',time)\n",
55
    "        temp = temp.groupby(['timestamp']).mean()\n",
56
    "        strain_oct = pd.concat([strain_oct, temp])  #DataFrame.append was removed in pandas 2.0\n"
57
   ]
58
  },
59
  {
60
   "cell_type": "code",
61
   "execution_count": 49,
62
   "id": "bf71e1d5",
63
   "metadata": {},
64
   "outputs": [],
65
   "source": [
66
    "#column labels strain_1 .. strain_16\n",
67
    "col_name = []\n",
68
    "for i in range(1, 17):\n",
69
    "    col_name += [\"strain_{}\".format(i)]\n",
70
    "\n",
71
    "#put the strain readings in a dataframe and prepend the timestamps\n",
72
    "strain_oct = pd.DataFrame(data=strain, columns=col_name)\n",
73
    "strain_oct.insert(loc=0, column='timestamp', value=time)\n"
74
   ]
75
  },
76
  {
77
   "cell_type": "code",
78
   "execution_count": null,
79
   "id": "a1e7388f",
80
   "metadata": {},
81
   "outputs": [],
82
   "source": [
83
    "#convert matlab time to date_time stamp\n",
84
    "#dates = strain_oct['mat_time'].apply(lambda matlab_datenum: pd.to_datetime(matlab_datenum-719529,unit='d').round('s'))\n",
85
    "#strain_oct.insert(1, 'timestamp', dates)\n",
86
    "\n",
87
    "#group items with same timestamp values and average the strain values; drop the legacy 'mat_time' column only if present\n",
88
    "strain_oct = strain_oct.groupby(['timestamp']).mean().drop(columns=['mat_time'], errors='ignore')"
89
   ]
90
  },
91
  {
92
   "cell_type": "code",
93
   "execution_count": 15,
94
   "id": "87f32135",
95
   "metadata": {},
96
   "outputs": [],
97
   "source": [
98
    "#save the dataframe to CSV file\n",
99
    "strain_oct.to_csv('daywise_oct.csv')"
100
   ]
101
  },
102
  {
103
   "cell_type": "code",
104
   "execution_count": 19,
105
   "id": "80976996",
106
   "metadata": {},
107
   "outputs": [],
108
   "source": [
109
    "#save the dataframe to .mat file\n",
110
    "import scipy.io as sio\n",
111
    "destination_folder_path = ''\n",
112
    "sio.savemat(os.path.join(destination_folder_path,'daywise_oct.mat'), {name: col.values for name, col in strain_oct.items()})"
113
   ]
114
  },
115
  {
116
   "cell_type": "code",
117
   "execution_count": 26,
118
   "id": "735f1765",
119
   "metadata": {},
120
   "outputs": [],
121
   "source": [
122
    "#looping to include all data in april month\n",
123
    "\n",
124
    "for j in range(len(arr2)):\n",
125
    "    strain = []\n",
126
    "    time = []\n",
127
    "    mat = scipy.io.loadmat('./traindata_201904/'+arr2[j])\n",
128
    "    for item in mat['predat_sg'][0][0][3]:\n",
129
    "        strain.append(item)\n",
130
    "    for item in mat['predat_sg'][0][0][0]:\n",
131
    "        #convert MATLAB datenum (days) to a calendar date; 719529 shifts it to days since 1970-01-01\n",
132
    "        time.append(pd.to_datetime(item-719529,unit='d').round('s')[0].date())\n",
133
    "    if j==0:\n",
134
    "        col_name = []\n",
135
    "        for i in range (1,17):\n",
136
    "            col_name.append(\"strain_\"+str(i))\n",
137
    "\n",
138
    "        #create dataframe to add the strain values\n",
139
    "        strain_apr = pd.DataFrame(strain, columns=col_name)\n",
140
    "        strain_apr.insert(0, 'timestamp', time)\n",
141
    "        #average per date and keep 'timestamp' as the index so the frames added in the else branch line up\n",
142
    "        strain_apr = strain_apr.groupby(['timestamp']).mean()\n",
143
    "    else:\n",
144
    "        temp = pd.DataFrame(strain, columns=col_name)\n",
145
    "        temp.insert(0,'timestamp',time)\n",
146
    "        temp = temp.groupby(['timestamp']).mean()\n",
147
    "        strain_apr = pd.concat([strain_apr, temp])  #DataFrame.append was removed in pandas 2.0\n",
148
    "\n",
149
    "#save the dataframe to CSV file\n",
150
    "strain_apr.to_csv('daywise_apr.csv')\n",
151
    "\n",
152
    "#save the dataframe to .mat file\n",
153
    "import scipy.io as sio\n",
154
    "destination_folder_path = ''\n",
155
    "sio.savemat(os.path.join(destination_folder_path,'daywise_apr.mat'), {name: col.values for name, col in strain_apr.items()})"
156
   ]
157
  },
158
  {
159
   "cell_type": "code",
160
   "execution_count": 28,
161
   "id": "a62fa77b",
162
   "metadata": {},
163
   "outputs": [
164
    {
165
     "data": {
166
      "text/plain": [
167
       "[<matplotlib.lines.Line2D at 0x1feca1f0670>,\n",
168
       " <matplotlib.lines.Line2D at 0x1feca0447f0>,\n",
169
       " <matplotlib.lines.Line2D at 0x1feca044850>,\n",
170
       " <matplotlib.lines.Line2D at 0x1feca044a30>,\n",
171
       " <matplotlib.lines.Line2D at 0x1feca044b50>,\n",
172
       " <matplotlib.lines.Line2D at 0x1feca044c70>,\n",
173
       " <matplotlib.lines.Line2D at 0x1feca044d90>,\n",
174
       " <matplotlib.lines.Line2D at 0x1feca044eb0>,\n",
175
       " <matplotlib.lines.Line2D at 0x1feca044fd0>,\n",
176
       " <matplotlib.lines.Line2D at 0x1feca1ef130>,\n",
177
       " <matplotlib.lines.Line2D at 0x1feca1f0dc0>,\n",
178
       " <matplotlib.lines.Line2D at 0x1feca1ef250>,\n",
179
       " <matplotlib.lines.Line2D at 0x1feca1ef460>,\n",
180
       " <matplotlib.lines.Line2D at 0x1feca1ef580>,\n",
181
       " <matplotlib.lines.Line2D at 0x1feca1ef6a0>,\n",
182
       " <matplotlib.lines.Line2D at 0x1feca1ef7c0>]"
183
      ]
184
     },
185
     "execution_count": 28,
186
     "metadata": {},
187
     "output_type": "execute_result"
188
    },
189
    {
190
     "data": {
191
      "image/png": "\n",
192
      "text/plain": [
193
       "<Figure size 864x432 with 1 Axes>"
194
      ]
195
     },
196
     "metadata": {
197
      "needs_background": "light"
198
     },
199
     "output_type": "display_data"
200
    }
201
   ],
202
   "source": [
203
    "from matplotlib.pyplot import figure\n",
204
    "\n",
205
    "figure(figsize=(12, 6))\n",
206
    "plt.plot(strain_oct)\n"
207
   ]
208
  },
209
  {
210
   "cell_type": "code",
211
   "execution_count": 27,
212
   "id": "c363f44e",
213
   "metadata": {},
214
   "outputs": [
215
    {
216
     "data": {
217
      "text/plain": [
218
       "[<matplotlib.lines.Line2D at 0x1fec2c48dc0>,\n",
219
       " <matplotlib.lines.Line2D at 0x1fec5a7c190>,\n",
220
       " <matplotlib.lines.Line2D at 0x1fec5a7c1f0>,\n",
221
       " <matplotlib.lines.Line2D at 0x1fec5a7c3d0>,\n",
222
       " <matplotlib.lines.Line2D at 0x1fec5a7c4f0>,\n",
223
       " <matplotlib.lines.Line2D at 0x1fec5a7c610>,\n",
224
       " <matplotlib.lines.Line2D at 0x1fec5a7c730>,\n",
225
       " <matplotlib.lines.Line2D at 0x1fec5a7c850>,\n",
226
       " <matplotlib.lines.Line2D at 0x1fec5a7c970>,\n",
227
       " <matplotlib.lines.Line2D at 0x1fec5a7ca90>,\n",
228
       " <matplotlib.lines.Line2D at 0x1fec2de0880>,\n",
229
       " <matplotlib.lines.Line2D at 0x1fec5a7cbb0>,\n",
230
       " <matplotlib.lines.Line2D at 0x1fec5a7cdc0>,\n",
231
       " <matplotlib.lines.Line2D at 0x1fec5a7cee0>,\n",
232
       " <matplotlib.lines.Line2D at 0x1fec5a51040>,\n",
233
       " <matplotlib.lines.Line2D at 0x1fec5a51160>]"
234
      ]
235
     },
236
     "execution_count": 27,
237
     "metadata": {},
238
     "output_type": "execute_result"
239
    },
240
    {
241
     "data": {
242
      "image/png": "\n",
243
      "text/plain": [
244
       "<Figure size 864x432 with 1 Axes>"
245
      ]
246
     },
247
     "metadata": {
248
      "needs_background": "light"
249
     },
250
     "output_type": "display_data"
251
    }
252
   ],
253
   "source": [
254
    "plt.figure(figsize=(12, 6))  #use plt.figure so this cell does not rely on an import made in another cell\n",
255
    "plt.plot(strain_apr)\n"
256
   ]
257
  },
258
  {
259
   "cell_type": "code",
260
   "execution_count": 33,
261
   "id": "47d81ba9",
262
   "metadata": {},
263
   "outputs": [],
264
   "source": [
265
    "df = pd.read_csv(\"daywise_oct.csv\")"
266
   ]
267
  },
268
  {
269
   "cell_type": "code",
270
   "execution_count": null,
271
   "id": "73a050ea",
272
   "metadata": {},
273
   "outputs": [],
274
   "source": [
275
    "x = df['timestamp']\n",
276
    "for col in ('strain_1', 'strain_2'):  #df['strain_1','strain_2'] is a tuple-key lookup and raises KeyError\n",
277
    "    plt.scatter(x, df[col], label=col)"
278
   ]
279
  },
280
  {
281
   "cell_type": "code",
282
   "execution_count": 32,
283
   "id": "d42887da",
284
   "metadata": {},
285
   "outputs": [],
286
   "source": [
287
    "#find lag in the strain values (order = 1); arr was listed from ./traindata_201910, so load from that folder\n",
288
    "mat = scipy.io.loadmat('./traindata_201910/'+arr[0])"
289
   ]
290
  },
291
  {
292
   "cell_type": "code",
293
   "execution_count": 41,
294
   "id": "177cf318",
295
   "metadata": {},
296
   "outputs": [
297
    {
298
     "data": {
299
      "text/plain": [
300
       "array([-3.39062644e-07, -2.76319165e-07,             nan,  2.19765438e-07,\n",
301
       "                   nan,             nan,  5.41557452e-07, -1.06885435e-07,\n",
302
       "                   nan,             nan,             nan,             nan,\n",
303
       "                   nan,             nan,             nan,             nan])"
304
      ]
305
     },
306
     "execution_count": 41,
307
     "metadata": {},
308
     "output_type": "execute_result"
309
    }
310
   ],
311
   "source": [
312
    "mat['predat_sg'][0][-1][-1][0]"
313
   ]
314
  },
315
  {
316
   "cell_type": "code",
317
   "execution_count": 32,
318
   "id": "1a4c2c62",
319
   "metadata": {},
320
   "outputs": [
321
    {
322
     "data": {
323
      "text/plain": [
324
       "array([[(array([[737335.67221965]]), array([[array(['tBD31A'], dtype='<U6')],\n",
325
       "               [array(['rhBD31A'], dtype='<U7')],\n",
326
       "               [array(['tVL'], dtype='<U3')],\n",
327
       "               [array(['rhVL'], dtype='<U4')],\n",
328
       "               [array(['vpVL'], dtype='<U4')],\n",
329
       "               [array(['grVL'], dtype='<U4')],\n",
330
       "               [array(['drVL'], dtype='<U4')],\n",
331
       "               [array(['dnrVL'], dtype='<U5')],\n",
332
       "               [array(['raVL'], dtype='<U4')],\n",
333
       "               [array(['wsVL'], dtype='<U4')],\n",
334
       "               [array(['wdVL'], dtype='<U4')]], dtype=object), array([[          nan,   71.28002926,   16.71666718,   74.5       ,\n",
335
       "                1417.87195067,           nan,           nan,           nan,\n",
336
       "                          nan,           nan,           nan]]))                                                                   ]],\n",
337
       "      dtype=[('sdn', 'O'), ('labels', 'O'), ('data', 'O')])"
338
      ]
339
     },
340
     "execution_count": 32,
341
     "metadata": {},
342
     "output_type": "execute_result"
343
    }
344
   ],
345
   "source": [
346
    "mat['predat_env']"
347
   ]
348
  },
349
  {
350
   "cell_type": "code",
351
   "execution_count": 52,
352
   "id": "606b26a4",
353
   "metadata": {},
354
   "outputs": [],
355
   "source": [
356
    "#looping to include all data in october month\n",
357
    "#LATEST\n",
358
    "for j in range(len(arr)):\n",
359
    "    strain = []\n",
360
    "    time = []\n",
361
    "    mat = scipy.io.loadmat('./traindata_201910/'+arr[j])\n",
362
    "    for item in mat['predat_sg'][0][0][3]:\n",
363
    "        strain.append(item)\n",
364
    "    for item in mat['predat_sg'][0][0][0]:\n",
365
    "        #convert MATLAB datenum (days) to a calendar date; 719529 shifts it to days since 1970-01-01\n",
366
    "        time.append(pd.to_datetime(item-719529,unit='d').round('s')[0].date())\n",
367
    "    if j==0:\n",
368
    "        col_name = []\n",
369
    "        for i in range (1,17):\n",
370
    "            col_name.append(\"strain_\"+str(i))\n",
371
    "    \n",
372
    "        #create dataframe of the strain values, averaged per date, then attach this file's environment readings\n",
373
    "        strain_oct = pd.DataFrame(strain, columns=col_name)\n",
374
    "        strain_oct.insert(0, 'timestamp', time)\n",
375
    "        strain_oct = strain_oct.groupby(['timestamp']).mean()\n",
376
    "        strain_oct['Surftemp'] = mat['predat_env'][0][0][-1][0][0] #Surface temperature at one point below deck\n",
377
    "        strain_oct['Rh'] = mat['predat_env'][0][0][-1][0][1] #Relative humidity at one point below deck\n",
378
    "        strain_oct['airtemp'] = mat['predat_env'][0][0][-1][0][2] #Average air temperature\n",
379
    "        strain_oct['avgRh'] = mat['predat_env'][0][0][-1][0][3] #Average Relative Humidity\n",
380
    "        strain_oct['avgVPr'] = mat['predat_env'][0][0][-1][0][4] #Average Vapour Pressure\n",
381
    "        strain_oct['avgGR'] = mat['predat_env'][0][0][-1][0][5] #Average global Radiation\n",
382
    "        strain_oct['avgdR']= mat['predat_env'][0][0][-1][0][6] #Average diffuse radiation\n",
383
    "        strain_oct['avgdnr'] = mat['predat_env'][0][0][-1][0][7] #Average Direct normal radiation\n",
384
    "        strain_oct['totalrain'] = mat['predat_env'][0][0][-1][0][8] #Total Rain\n",
385
    "        strain_oct['avgws10'] = mat['predat_env'][0][0][-1][0][9] #wind speed at 10m above ground\n",
386
    "        strain_oct['avgwd10'] = mat['predat_env'][0][0][-1][0][10] #wind direction at 10m above ground\n",
387
    "    else:\n",
388
    "        temp = pd.DataFrame(strain, columns=col_name)\n",
389
    "        temp.insert(0,'timestamp',time)\n",
390
    "        temp = temp.groupby(['timestamp']).mean()\n",
391
    "        temp['Surftemp'] = mat['predat_env'][0][0][-1][0][0] #Surface temperature at one point below deck\n",
392
    "        temp['Rh'] = mat['predat_env'][0][0][-1][0][1] #Relative humidity at one point below deck\n",
393
    "        temp['airtemp'] = mat['predat_env'][0][0][-1][0][2] #Average air temperature\n",
394
    "        temp['avgRh'] = mat['predat_env'][0][0][-1][0][3] #Average Relative Humidity\n",
395
    "        temp['avgVPr'] = mat['predat_env'][0][0][-1][0][4] #Average Vapour Pressure\n",
396
    "        temp['avgGR'] = mat['predat_env'][0][0][-1][0][5] #Average global Radiation\n",
397
    "        temp['avgdR']= mat['predat_env'][0][0][-1][0][6] #Average diffuse radiation\n",
398
    "        temp['avgdnr'] = mat['predat_env'][0][0][-1][0][7] #Average Direct normal radiation\n",
399
    "        temp['totalrain'] = mat['predat_env'][0][0][-1][0][8] #Total Rain\n",
400
    "        temp['avgws10'] = mat['predat_env'][0][0][-1][0][9] #wind speed at 10m above ground\n",
401
    "        temp['avgwd10'] = mat['predat_env'][0][0][-1][0][10] #wind direction at 10m above ground\n",
402
    "        strain_oct = pd.concat([strain_oct, temp])  #DataFrame.append was removed in pandas 2.0\n",
403
    "\n",
404
    "#save the dataframe to CSV file\n",
405
    "strain_oct.to_csv('daywise_oct_with_env2_final.csv')"
406
   ]
407
  },
408
  {
409
   "cell_type": "code",
410
   "execution_count": 37,
411
   "id": "48bd39a0",
412
   "metadata": {},
413
   "outputs": [],
414
   "source": [
415
    "df1 = pd.read_csv(\"daywise_oct_with_env2_final.csv\")"
416
   ]
417
  },
418
  {
419
   "cell_type": "code",
420
   "execution_count": 38,
421
   "id": "af9780af",
422
   "metadata": {},
423
   "outputs": [
424
    {
425
     "data": {
426
      "text/html": [
427
       "<div>\n",
428
       "<style scoped>\n",
429
       "    .dataframe tbody tr th:only-of-type {\n",
430
       "        vertical-align: middle;\n",
431
       "    }\n",
432
       "\n",
433
       "    .dataframe tbody tr th {\n",
434
       "        vertical-align: top;\n",
435
       "    }\n",
436
       "\n",
437
       "    .dataframe thead th {\n",
438
       "        text-align: right;\n",
439
       "    }\n",
440
       "</style>\n",
441
       "<table border=\"1\" class=\"dataframe\">\n",
442
       "  <thead>\n",
443
       "    <tr style=\"text-align: right;\">\n",
444
       "      <th></th>\n",
445
       "      <th>timestamp</th>\n",
446
       "      <th>strain_1</th>\n",
447
       "      <th>strain_2</th>\n",
448
       "      <th>strain_3</th>\n",
449
       "      <th>strain_4</th>\n",
450
       "      <th>strain_5</th>\n",
451
       "      <th>strain_6</th>\n",
452
       "      <th>strain_7</th>\n",
453
       "      <th>strain_8</th>\n",
454
       "      <th>strain_9</th>\n",
455
       "      <th>...</th>\n",
456
       "      <th>Rh</th>\n",
457
       "      <th>airtemp</th>\n",
458
       "      <th>avgRh</th>\n",
459
       "      <th>avgVPr</th>\n",
460
       "      <th>avgGR</th>\n",
461
       "      <th>avgdR</th>\n",
462
       "      <th>avgdnr</th>\n",
463
       "      <th>totalrain</th>\n",
464
       "      <th>avgws10</th>\n",
465
       "      <th>avgwd10</th>\n",
466
       "    </tr>\n",
467
       "  </thead>\n",
468
       "  <tbody>\n",
469
       "    <tr>\n",
470
       "      <th>0</th>\n",
471
       "      <td>2018-10-02</td>\n",
472
       "      <td>1.804882e-06</td>\n",
473
       "      <td>1.291150e-06</td>\n",
474
       "      <td>NaN</td>\n",
475
       "      <td>0.000003</td>\n",
476
       "      <td>NaN</td>\n",
477
       "      <td>NaN</td>\n",
478
       "      <td>0.000003</td>\n",
479
       "      <td>5.482034e-06</td>\n",
480
       "      <td>NaN</td>\n",
481
       "      <td>...</td>\n",
482
       "      <td>71.280029</td>\n",
483
       "      <td>16.716667</td>\n",
484
       "      <td>74.500000</td>\n",
485
       "      <td>1417.871951</td>\n",
486
       "      <td>NaN</td>\n",
487
       "      <td>NaN</td>\n",
488
       "      <td>NaN</td>\n",
489
       "      <td>NaN</td>\n",
490
       "      <td>NaN</td>\n",
491
       "      <td>NaN</td>\n",
492
       "    </tr>\n",
493
       "    <tr>\n",
494
       "      <th>1</th>\n",
495
       "      <td>2018-10-03</td>\n",
496
       "      <td>2.269802e-06</td>\n",
497
       "      <td>1.698958e-06</td>\n",
498
       "      <td>NaN</td>\n",
499
       "      <td>0.000004</td>\n",
500
       "      <td>NaN</td>\n",
501
       "      <td>NaN</td>\n",
502
       "      <td>0.000003</td>\n",
503
       "      <td>5.813794e-06</td>\n",
504
       "      <td>NaN</td>\n",
505
       "      <td>...</td>\n",
506
       "      <td>76.997064</td>\n",
507
       "      <td>12.141666</td>\n",
508
       "      <td>79.166664</td>\n",
509
       "      <td>1120.819324</td>\n",
510
       "      <td>NaN</td>\n",
511
       "      <td>NaN</td>\n",
512
       "      <td>NaN</td>\n",
513
       "      <td>NaN</td>\n",
514
       "      <td>NaN</td>\n",
515
       "      <td>NaN</td>\n",
516
       "    </tr>\n",
517
       "    <tr>\n",
518
       "      <th>2</th>\n",
519
       "      <td>2018-10-03</td>\n",
520
       "      <td>2.128605e-06</td>\n",
521
       "      <td>1.411400e-06</td>\n",
522
       "      <td>NaN</td>\n",
523
       "      <td>0.000003</td>\n",
524
       "      <td>NaN</td>\n",
525
       "      <td>NaN</td>\n",
526
       "      <td>0.000002</td>\n",
527
       "      <td>5.213818e-06</td>\n",
528
       "      <td>NaN</td>\n",
529
       "      <td>...</td>\n",
530
       "      <td>55.975091</td>\n",
531
       "      <td>15.683333</td>\n",
532
       "      <td>61.250000</td>\n",
533
       "      <td>1091.387360</td>\n",
534
       "      <td>NaN</td>\n",
535
       "      <td>NaN</td>\n",
536
       "      <td>NaN</td>\n",
537
       "      <td>NaN</td>\n",
538
       "      <td>NaN</td>\n",
539
       "      <td>NaN</td>\n",
540
       "    </tr>\n",
541
       "    <tr>\n",
542
       "      <th>3</th>\n",
543
       "      <td>2018-10-04</td>\n",
544
       "      <td>3.457613e-06</td>\n",
545
       "      <td>2.919155e-06</td>\n",
546
       "      <td>NaN</td>\n",
547
       "      <td>0.000004</td>\n",
548
       "      <td>NaN</td>\n",
549
       "      <td>NaN</td>\n",
550
       "      <td>0.000004</td>\n",
551
       "      <td>8.611123e-06</td>\n",
552
       "      <td>NaN</td>\n",
553
       "      <td>...</td>\n",
554
       "      <td>79.072215</td>\n",
555
       "      <td>12.958333</td>\n",
556
       "      <td>83.083336</td>\n",
557
       "      <td>1241.060048</td>\n",
558
       "      <td>NaN</td>\n",
559
       "      <td>NaN</td>\n",
560
       "      <td>NaN</td>\n",
561
       "      <td>NaN</td>\n",
562
       "      <td>NaN</td>\n",
563
       "      <td>NaN</td>\n",
564
       "    </tr>\n",
565
       "    <tr>\n",
566
       "      <th>4</th>\n",
567
       "      <td>2018-10-04</td>\n",
568
       "      <td>1.420150e-07</td>\n",
569
       "      <td>-5.852899e-07</td>\n",
570
       "      <td>NaN</td>\n",
571
       "      <td>0.000005</td>\n",
572
       "      <td>NaN</td>\n",
573
       "      <td>NaN</td>\n",
574
       "      <td>0.000005</td>\n",
575
       "      <td>7.968894e-07</td>\n",
576
       "      <td>NaN</td>\n",
577
       "      <td>...</td>\n",
578
       "      <td>58.432998</td>\n",
579
       "      <td>21.924999</td>\n",
580
       "      <td>54.500000</td>\n",
581
       "      <td>1433.934434</td>\n",
582
       "      <td>NaN</td>\n",
583
       "      <td>NaN</td>\n",
584
       "      <td>NaN</td>\n",
585
       "      <td>NaN</td>\n",
586
       "      <td>NaN</td>\n",
587
       "      <td>NaN</td>\n",
588
       "    </tr>\n",
589
       "    <tr>\n",
590
       "      <th>5</th>\n",
591
       "      <td>2018-10-05</td>\n",
592
       "      <td>1.282716e-06</td>\n",
593
       "      <td>2.430030e-07</td>\n",
594
       "      <td>NaN</td>\n",
595
       "      <td>0.000008</td>\n",
596
       "      <td>NaN</td>\n",
597
       "      <td>NaN</td>\n",
598
       "      <td>0.000007</td>\n",
599
       "      <td>4.326709e-06</td>\n",
600
       "      <td>NaN</td>\n",
601
       "      <td>...</td>\n",
602
       "      <td>77.300284</td>\n",
603
       "      <td>9.525000</td>\n",
604
       "      <td>92.833336</td>\n",
605
       "      <td>1104.173129</td>\n",
606
       "      <td>NaN</td>\n",
607
       "      <td>NaN</td>\n",
608
       "      <td>NaN</td>\n",
609
       "      <td>NaN</td>\n",
610
       "      <td>NaN</td>\n",
611
       "      <td>NaN</td>\n",
612
       "    </tr>\n",
613
       "    <tr>\n",
614
       "      <th>6</th>\n",
615
       "      <td>2018-10-05</td>\n",
616
       "      <td>-3.599416e-07</td>\n",
617
       "      <td>-1.080711e-06</td>\n",
618
       "      <td>NaN</td>\n",
619
       "      <td>0.000005</td>\n",
620
       "      <td>NaN</td>\n",
621
       "      <td>NaN</td>\n",
622
       "      <td>0.000004</td>\n",
623
       "      <td>1.512664e-06</td>\n",
624
       "      <td>NaN</td>\n",
625
       "      <td>...</td>\n",
626
       "      <td>47.062426</td>\n",
627
       "      <td>23.875000</td>\n",
628
       "      <td>45.583332</td>\n",
629
       "      <td>1349.343321</td>\n",
630
       "      <td>NaN</td>\n",
631
       "      <td>NaN</td>\n",
632
       "      <td>NaN</td>\n",
633
       "      <td>NaN</td>\n",
634
       "      <td>NaN</td>\n",
635
       "      <td>NaN</td>\n",
636
       "    </tr>\n",
637
       "    <tr>\n",
638
       "      <th>7</th>\n",
639
       "      <td>2018-10-06</td>\n",
640
       "      <td>3.045380e-06</td>\n",
641
       "      <td>2.472536e-06</td>\n",
642
       "      <td>NaN</td>\n",
643
       "      <td>0.000006</td>\n",
644
       "      <td>NaN</td>\n",
645
       "      <td>NaN</td>\n",
646
       "      <td>0.000005</td>\n",
647
       "      <td>6.635354e-06</td>\n",
648
       "      <td>NaN</td>\n",
649
       "      <td>...</td>\n",
650
       "      <td>78.543308</td>\n",
651
       "      <td>11.433333</td>\n",
652
       "      <td>90.500000</td>\n",
653
       "      <td>1222.699295</td>\n",
654
       "      <td>NaN</td>\n",
655
       "      <td>NaN</td>\n",
656
       "      <td>NaN</td>\n",
657
       "      <td>NaN</td>\n",
658
       "      <td>NaN</td>\n",
659
       "      <td>NaN</td>\n",
660
       "    </tr>\n",
661
       "    <tr>\n",
662
       "      <th>8</th>\n",
663
       "      <td>2018-10-08</td>\n",
664
       "      <td>-4.537585e-07</td>\n",
665
       "      <td>-1.072013e-06</td>\n",
666
       "      <td>NaN</td>\n",
667
       "      <td>0.000006</td>\n",
668
       "      <td>NaN</td>\n",
669
       "      <td>NaN</td>\n",
670
       "      <td>0.000005</td>\n",
671
       "      <td>8.118908e-07</td>\n",
672
       "      <td>NaN</td>\n",
673
       "      <td>...</td>\n",
674
       "      <td>73.230142</td>\n",
675
       "      <td>5.833333</td>\n",
676
       "      <td>91.916664</td>\n",
677
       "      <td>849.545823</td>\n",
678
       "      <td>NaN</td>\n",
679
       "      <td>NaN</td>\n",
680
       "      <td>NaN</td>\n",
681
       "      <td>NaN</td>\n",
682
       "      <td>NaN</td>\n",
683
       "      <td>NaN</td>\n",
684
       "    </tr>\n",
685
       "    <tr>\n",
686
       "      <th>9</th>\n",
687
       "      <td>2018-10-08</td>\n",
688
       "      <td>-1.061381e-07</td>\n",
689
       "      <td>-7.471682e-07</td>\n",
690
       "      <td>NaN</td>\n",
691
       "      <td>0.000005</td>\n",
692
       "      <td>NaN</td>\n",
693
       "      <td>NaN</td>\n",
694
       "      <td>0.000005</td>\n",
695
       "      <td>6.869932e-07</td>\n",
696
       "      <td>NaN</td>\n",
697
       "      <td>...</td>\n",
698
       "      <td>52.548953</td>\n",
699
       "      <td>15.975000</td>\n",
700
       "      <td>56.000000</td>\n",
701
       "      <td>1016.622559</td>\n",
702
       "      <td>NaN</td>\n",
703
       "      <td>NaN</td>\n",
704
       "      <td>NaN</td>\n",
705
       "      <td>NaN</td>\n",
706
       "      <td>NaN</td>\n",
707
       "      <td>NaN</td>\n",
708
       "    </tr>\n",
709
       "    <tr>\n",
710
       "      <th>10</th>\n",
711
       "      <td>2018-10-09</td>\n",
712
       "      <td>1.628155e-06</td>\n",
713
       "      <td>1.257122e-06</td>\n",
714
       "      <td>NaN</td>\n",
715
       "      <td>0.000004</td>\n",
716
       "      <td>NaN</td>\n",
717
       "      <td>NaN</td>\n",
718
       "      <td>0.000004</td>\n",
719
       "      <td>5.748393e-06</td>\n",
720
       "      <td>NaN</td>\n",
721
       "      <td>...</td>\n",
722
       "      <td>77.955239</td>\n",
723
       "      <td>6.358333</td>\n",
724
       "      <td>92.833336</td>\n",
725
       "      <td>889.771595</td>\n",
726
       "      <td>NaN</td>\n",
727
       "      <td>NaN</td>\n",
728
       "      <td>NaN</td>\n",
729
       "      <td>NaN</td>\n",
730
       "      <td>NaN</td>\n",
731
       "      <td>NaN</td>\n",
732
       "    </tr>\n",
733
       "    <tr>\n",
734
       "      <th>11</th>\n",
735
       "      <td>2018-10-09</td>\n",
736
       "      <td>-3.682028e-07</td>\n",
737
       "      <td>-1.007747e-06</td>\n",
738
       "      <td>NaN</td>\n",
739
       "      <td>0.000005</td>\n",
740
       "      <td>NaN</td>\n",
741
       "      <td>NaN</td>\n",
742
       "      <td>0.000005</td>\n",
743
       "      <td>5.841734e-07</td>\n",
744
       "      <td>NaN</td>\n",
745
       "      <td>...</td>\n",
746
       "      <td>56.269163</td>\n",
747
       "      <td>18.052333</td>\n",
748
       "      <td>57.583332</td>\n",
749
       "      <td>1192.356382</td>\n",
750
       "      <td>20.417556</td>\n",
751
       "      <td>18.671694</td>\n",
752
       "      <td>16.358833</td>\n",
753
       "      <td>0.0</td>\n",
754
       "      <td>NaN</td>\n",
755
       "      <td>NaN</td>\n",
756
       "    </tr>\n",
757
       "    <tr>\n",
758
       "      <th>12</th>\n",
759
       "      <td>2018-10-10</td>\n",
760
       "      <td>-4.486108e-07</td>\n",
761
       "      <td>-1.049204e-06</td>\n",
762
       "      <td>NaN</td>\n",
763
       "      <td>0.000005</td>\n",
764
       "      <td>NaN</td>\n",
765
       "      <td>NaN</td>\n",
766
       "      <td>0.000005</td>\n",
767
       "      <td>4.158732e-07</td>\n",
768
       "      <td>NaN</td>\n",
769
       "      <td>...</td>\n",
770
       "      <td>81.122389</td>\n",
771
       "      <td>9.398639</td>\n",
772
       "      <td>93.750000</td>\n",
773
       "      <td>1105.629785</td>\n",
774
       "      <td>157.019694</td>\n",
775
       "      <td>66.948917</td>\n",
776
       "      <td>407.837417</td>\n",
777
       "      <td>0.0</td>\n",
778
       "      <td>NaN</td>\n",
779
       "      <td>NaN</td>\n",
780
       "    </tr>\n",
781
       "    <tr>\n",
782
       "      <th>13</th>\n",
783
       "      <td>2018-10-10</td>\n",
784
       "      <td>-3.506244e-07</td>\n",
785
       "      <td>-9.312912e-07</td>\n",
786
       "      <td>NaN</td>\n",
787
       "      <td>0.000004</td>\n",
788
       "      <td>-8.837225e-07</td>\n",
789
       "      <td>NaN</td>\n",
790
       "      <td>0.000004</td>\n",
791
       "      <td>5.287465e-07</td>\n",
792
       "      <td>NaN</td>\n",
793
       "      <td>...</td>\n",
794
       "      <td>54.889717</td>\n",
795
       "      <td>23.548417</td>\n",
796
       "      <td>56.416668</td>\n",
797
       "      <td>1637.594616</td>\n",
798
       "      <td>30.327806</td>\n",
799
       "      <td>16.180389</td>\n",
800
       "      <td>63.654694</td>\n",
801
       "      <td>0.0</td>\n",
802
       "      <td>NaN</td>\n",
803
       "      <td>NaN</td>\n",
804
       "    </tr>\n",
805
       "    <tr>\n",
806
       "      <th>14</th>\n",
807
       "      <td>2018-10-11</td>\n",
808
       "      <td>9.078712e-08</td>\n",
809
       "      <td>-6.254588e-07</td>\n",
810
       "      <td>NaN</td>\n",
811
       "      <td>0.000007</td>\n",
812
       "      <td>-5.223130e-07</td>\n",
813
       "      <td>NaN</td>\n",
814
       "      <td>0.000007</td>\n",
815
       "      <td>1.800594e-06</td>\n",
816
       "      <td>NaN</td>\n",
817
       "      <td>...</td>\n",
818
       "      <td>72.342233</td>\n",
819
       "      <td>19.004861</td>\n",
820
       "      <td>76.500000</td>\n",
821
       "      <td>1681.335790</td>\n",
822
       "      <td>31.314111</td>\n",
823
       "      <td>27.076306</td>\n",
824
       "      <td>0.377667</td>\n",
825
       "      <td>0.0</td>\n",
826
       "      <td>NaN</td>\n",
827
       "      <td>NaN</td>\n",
828
       "    </tr>\n",
829
       "    <tr>\n",
830
       "      <th>15</th>\n",
831
       "      <td>2018-10-11</td>\n",
832
       "      <td>-5.495572e-07</td>\n",
833
       "      <td>-1.042136e-06</td>\n",
834
       "      <td>NaN</td>\n",
835
       "      <td>0.000005</td>\n",
836
       "      <td>-6.461451e-07</td>\n",
837
       "      <td>NaN</td>\n",
838
       "      <td>0.000005</td>\n",
839
       "      <td>8.852473e-07</td>\n",
840
       "      <td>NaN</td>\n",
841
       "      <td>...</td>\n",
842
       "      <td>53.908886</td>\n",
843
       "      <td>24.208334</td>\n",
844
       "      <td>55.916668</td>\n",
845
       "      <td>1688.607212</td>\n",
846
       "      <td>NaN</td>\n",
847
       "      <td>NaN</td>\n",
848
       "      <td>NaN</td>\n",
849
       "      <td>NaN</td>\n",
850
       "      <td>NaN</td>\n",
851
       "      <td>NaN</td>\n",
852
       "    </tr>\n",
853
       "    <tr>\n",
854
       "      <th>16</th>\n",
855
       "      <td>2018-10-12</td>\n",
856
       "      <td>2.827529e-06</td>\n",
857
       "      <td>2.354601e-06</td>\n",
858
       "      <td>NaN</td>\n",
859
       "      <td>0.000004</td>\n",
860
       "      <td>3.245773e-06</td>\n",
861
       "      <td>NaN</td>\n",
862
       "      <td>0.000004</td>\n",
863
       "      <td>6.803631e-06</td>\n",
864
       "      <td>NaN</td>\n",
865
       "      <td>...</td>\n",
866
       "      <td>83.950116</td>\n",
867
       "      <td>17.993750</td>\n",
868
       "      <td>89.166664</td>\n",
869
       "      <td>1839.557833</td>\n",
870
       "      <td>140.983056</td>\n",
871
       "      <td>78.890306</td>\n",
872
       "      <td>214.392639</td>\n",
873
       "      <td>0.0</td>\n",
874
       "      <td>NaN</td>\n",
875
       "      <td>NaN</td>\n",
876
       "    </tr>\n",
877
       "    <tr>\n",
878
       "      <th>17</th>\n",
879
       "      <td>2018-10-12</td>\n",
880
       "      <td>1.409051e-06</td>\n",
881
       "      <td>8.248487e-07</td>\n",
882
       "      <td>NaN</td>\n",
883
       "      <td>0.000006</td>\n",
884
       "      <td>1.552718e-06</td>\n",
885
       "      <td>NaN</td>\n",
886
       "      <td>0.000006</td>\n",
887
       "      <td>5.098572e-06</td>\n",
888
       "      <td>NaN</td>\n",
889
       "      <td>...</td>\n",
890
       "      <td>64.288978</td>\n",
891
       "      <td>23.465000</td>\n",
892
       "      <td>67.250000</td>\n",
893
       "      <td>1942.281645</td>\n",
894
       "      <td>30.878333</td>\n",
895
       "      <td>27.683333</td>\n",
896
       "      <td>9.416667</td>\n",
897
       "      <td>0.0</td>\n",
898
       "      <td>NaN</td>\n",
899
       "      <td>NaN</td>\n",
900
       "    </tr>\n",
901
       "    <tr>\n",
902
       "      <th>18</th>\n",
903
       "      <td>2018-10-15</td>\n",
904
       "      <td>2.527285e-06</td>\n",
905
       "      <td>2.073035e-06</td>\n",
906
       "      <td>NaN</td>\n",
907
       "      <td>0.000002</td>\n",
908
       "      <td>2.815451e-06</td>\n",
909
       "      <td>NaN</td>\n",
910
       "      <td>0.000002</td>\n",
911
       "      <td>4.371978e-06</td>\n",
912
       "      <td>NaN</td>\n",
913
       "      <td>...</td>\n",
914
       "      <td>59.638465</td>\n",
915
       "      <td>19.570000</td>\n",
916
       "      <td>63.250000</td>\n",
917
       "      <td>1439.851964</td>\n",
918
       "      <td>90.183333</td>\n",
919
       "      <td>85.575000</td>\n",
920
       "      <td>3.056667</td>\n",
921
       "      <td>0.0</td>\n",
922
       "      <td>NaN</td>\n",
923
       "      <td>NaN</td>\n",
924
       "    </tr>\n",
925
       "    <tr>\n",
926
       "      <th>19</th>\n",
927
       "      <td>2018-10-15</td>\n",
928
       "      <td>-4.270678e-07</td>\n",
929
       "      <td>-1.003826e-06</td>\n",
930
       "      <td>NaN</td>\n",
931
       "      <td>0.000005</td>\n",
932
       "      <td>-6.829385e-07</td>\n",
933
       "      <td>NaN</td>\n",
934
       "      <td>0.000005</td>\n",
935
       "      <td>7.821662e-07</td>\n",
936
       "      <td>NaN</td>\n",
937
       "      <td>...</td>\n",
938
       "      <td>41.219275</td>\n",
939
       "      <td>22.181667</td>\n",
940
       "      <td>44.416668</td>\n",
941
       "      <td>1187.027705</td>\n",
942
       "      <td>9.636667</td>\n",
943
       "      <td>12.235000</td>\n",
944
       "      <td>0.311667</td>\n",
945
       "      <td>0.0</td>\n",
946
       "      <td>NaN</td>\n",
947
       "      <td>NaN</td>\n",
948
       "    </tr>\n",
949
       "    <tr>\n",
950
       "      <th>20</th>\n",
951
       "      <td>2018-10-16</td>\n",
952
       "      <td>1.935912e-06</td>\n",
953
       "      <td>1.531248e-06</td>\n",
954
       "      <td>NaN</td>\n",
955
       "      <td>0.000004</td>\n",
956
       "      <td>2.574173e-06</td>\n",
957
       "      <td>NaN</td>\n",
958
       "      <td>0.000003</td>\n",
959
       "      <td>6.310965e-06</td>\n",
960
       "      <td>NaN</td>\n",
961
       "      <td>...</td>\n",
962
       "      <td>71.332262</td>\n",
963
       "      <td>11.291667</td>\n",
964
       "      <td>86.583336</td>\n",
965
       "      <td>1158.849084</td>\n",
966
       "      <td>149.348333</td>\n",
967
       "      <td>65.840000</td>\n",
968
       "      <td>435.375000</td>\n",
969
       "      <td>0.0</td>\n",
970
       "      <td>NaN</td>\n",
971
       "      <td>NaN</td>\n",
972
       "    </tr>\n",
973
       "    <tr>\n",
974
       "      <th>21</th>\n",
975
       "      <td>2018-10-16</td>\n",
976
       "      <td>-3.912998e-07</td>\n",
977
       "      <td>-9.402715e-07</td>\n",
978
       "      <td>NaN</td>\n",
979
       "      <td>0.000005</td>\n",
980
       "      <td>-8.452086e-07</td>\n",
981
       "      <td>NaN</td>\n",
982
       "      <td>0.000005</td>\n",
983
       "      <td>8.549726e-07</td>\n",
984
       "      <td>NaN</td>\n",
985
       "      <td>...</td>\n",
986
       "      <td>43.499465</td>\n",
987
       "      <td>22.855000</td>\n",
988
       "      <td>40.916668</td>\n",
989
       "      <td>1139.047585</td>\n",
990
       "      <td>22.431667</td>\n",
991
       "      <td>25.788333</td>\n",
992
       "      <td>0.680000</td>\n",
993
       "      <td>0.0</td>\n",
994
       "      <td>NaN</td>\n",
995
       "      <td>NaN</td>\n",
996
       "    </tr>\n",
997
       "    <tr>\n",
998
       "      <th>22</th>\n",
999
       "      <td>2018-10-17</td>\n",
1000
       "      <td>2.287292e-06</td>\n",
1001
       "      <td>1.759895e-06</td>\n",
1002
       "      <td>NaN</td>\n",
1003
       "      <td>0.000004</td>\n",
1004
       "      <td>2.737282e-06</td>\n",
1005
       "      <td>NaN</td>\n",
1006
       "      <td>0.000004</td>\n",
1007
       "      <td>5.843397e-06</td>\n",
1008
       "      <td>NaN</td>\n",
1009
       "      <td>...</td>\n",
1010
       "      <td>75.164982</td>\n",
1011
       "      <td>11.135000</td>\n",
1012
       "      <td>90.833336</td>\n",
1013
       "      <td>1203.156142</td>\n",
1014
       "      <td>126.298333</td>\n",
1015
       "      <td>78.948333</td>\n",
1016
       "      <td>177.325000</td>\n",
1017
       "      <td>0.0</td>\n",
1018
       "      <td>NaN</td>\n",
1019
       "      <td>NaN</td>\n",
1020
       "    </tr>\n",
1021
       "    <tr>\n",
1022
       "      <th>23</th>\n",
1023
       "      <td>2018-10-17</td>\n",
1024
       "      <td>-6.658138e-07</td>\n",
1025
       "      <td>-1.174673e-06</td>\n",
1026
       "      <td>NaN</td>\n",
1027
       "      <td>0.000006</td>\n",
1028
       "      <td>-9.838982e-07</td>\n",
1029
       "      <td>NaN</td>\n",
1030
       "      <td>0.000005</td>\n",
1031
       "      <td>8.058195e-07</td>\n",
1032
       "      <td>NaN</td>\n",
1033
       "      <td>...</td>\n",
1034
       "      <td>65.386193</td>\n",
1035
       "      <td>18.858334</td>\n",
1036
       "      <td>71.166664</td>\n",
1037
       "      <td>1549.889447</td>\n",
1038
       "      <td>NaN</td>\n",
1039
       "      <td>NaN</td>\n",
1040
       "      <td>NaN</td>\n",
1041
       "      <td>NaN</td>\n",
1042
       "      <td>NaN</td>\n",
1043
       "      <td>NaN</td>\n",
1044
       "    </tr>\n",
1045
       "    <tr>\n",
1046
       "      <th>24</th>\n",
1047
       "      <td>2018-10-18</td>\n",
1048
       "      <td>1.756547e-06</td>\n",
1049
       "      <td>1.209365e-06</td>\n",
1050
       "      <td>NaN</td>\n",
1051
       "      <td>0.000004</td>\n",
1052
       "      <td>2.360669e-06</td>\n",
1053
       "      <td>NaN</td>\n",
1054
       "      <td>0.000003</td>\n",
1055
       "      <td>5.703489e-06</td>\n",
1056
       "      <td>NaN</td>\n",
1057
       "      <td>...</td>\n",
1058
       "      <td>84.501079</td>\n",
1059
       "      <td>12.526667</td>\n",
1060
       "      <td>94.500000</td>\n",
1061
       "      <td>1372.213888</td>\n",
1062
       "      <td>104.860000</td>\n",
1063
       "      <td>89.093333</td>\n",
1064
       "      <td>50.601667</td>\n",
1065
       "      <td>0.0</td>\n",
1066
       "      <td>NaN</td>\n",
1067
       "      <td>NaN</td>\n",
1068
       "    </tr>\n",
1069
       "    <tr>\n",
1070
       "      <th>25</th>\n",
1071
       "      <td>2018-10-18</td>\n",
1072
       "      <td>1.696276e-06</td>\n",
1073
       "      <td>1.333564e-06</td>\n",
1074
       "      <td>NaN</td>\n",
1075
       "      <td>0.000003</td>\n",
1076
       "      <td>2.450028e-06</td>\n",
1077
       "      <td>NaN</td>\n",
1078
       "      <td>0.000003</td>\n",
1079
       "      <td>5.655112e-06</td>\n",
1080
       "      <td>NaN</td>\n",
1081
       "      <td>...</td>\n",
1082
       "      <td>68.986611</td>\n",
1083
       "      <td>15.483334</td>\n",
1084
       "      <td>76.583336</td>\n",
1085
       "      <td>1347.232662</td>\n",
1086
       "      <td>NaN</td>\n",
1087
       "      <td>NaN</td>\n",
1088
       "      <td>NaN</td>\n",
1089
       "      <td>NaN</td>\n",
1090
       "      <td>NaN</td>\n",
1091
       "      <td>NaN</td>\n",
1092
       "    </tr>\n",
1093
       "    <tr>\n",
1094
       "      <th>26</th>\n",
1095
       "      <td>2018-10-19</td>\n",
1096
       "      <td>2.643052e-06</td>\n",
1097
       "      <td>2.049523e-06</td>\n",
1098
       "      <td>NaN</td>\n",
1099
       "      <td>0.000003</td>\n",
1100
       "      <td>2.662817e-06</td>\n",
1101
       "      <td>NaN</td>\n",
1102
       "      <td>0.000003</td>\n",
1103
       "      <td>5.999171e-06</td>\n",
1104
       "      <td>NaN</td>\n",
1105
       "      <td>...</td>\n",
1106
       "      <td>78.343009</td>\n",
1107
       "      <td>11.849999</td>\n",
1108
       "      <td>86.750000</td>\n",
1109
       "      <td>1204.783340</td>\n",
1110
       "      <td>NaN</td>\n",
1111
       "      <td>NaN</td>\n",
1112
       "      <td>NaN</td>\n",
1113
       "      <td>NaN</td>\n",
1114
       "      <td>NaN</td>\n",
1115
       "      <td>NaN</td>\n",
1116
       "    </tr>\n",
1117
       "    <tr>\n",
1118
       "      <th>27</th>\n",
1119
       "      <td>2018-10-19</td>\n",
1120
       "      <td>-1.319548e-07</td>\n",
1121
       "      <td>-6.674203e-07</td>\n",
1122
       "      <td>NaN</td>\n",
1123
       "      <td>0.000005</td>\n",
1124
       "      <td>-4.296196e-07</td>\n",
1125
       "      <td>NaN</td>\n",
1126
       "      <td>0.000005</td>\n",
1127
       "      <td>1.068996e-06</td>\n",
1128
       "      <td>NaN</td>\n",
1129
       "      <td>...</td>\n",
1130
       "      <td>64.888729</td>\n",
1131
       "      <td>15.866667</td>\n",
1132
       "      <td>72.000000</td>\n",
1133
       "      <td>1298.070458</td>\n",
1134
       "      <td>NaN</td>\n",
1135
       "      <td>NaN</td>\n",
1136
       "      <td>NaN</td>\n",
1137
       "      <td>NaN</td>\n",
1138
       "      <td>NaN</td>\n",
1139
       "      <td>NaN</td>\n",
1140
       "    </tr>\n",
1141
       "    <tr>\n",
1142
       "      <th>28</th>\n",
1143
       "      <td>2018-10-20</td>\n",
1144
       "      <td>-1.332337e-06</td>\n",
1145
       "      <td>-1.943410e-06</td>\n",
1146
       "      <td>NaN</td>\n",
1147
       "      <td>0.000006</td>\n",
1148
       "      <td>-1.712419e-06</td>\n",
1149
       "      <td>NaN</td>\n",
1150
       "      <td>0.000005</td>\n",
1151
       "      <td>1.355707e-07</td>\n",
1152
       "      <td>NaN</td>\n",
1153
       "      <td>...</td>\n",
1154
       "      <td>75.949176</td>\n",
1155
       "      <td>7.075000</td>\n",
1156
       "      <td>95.500000</td>\n",
1157
       "      <td>961.637716</td>\n",
1158
       "      <td>NaN</td>\n",
1159
       "      <td>NaN</td>\n",
1160
       "      <td>NaN</td>\n",
1161
       "      <td>NaN</td>\n",
1162
       "      <td>NaN</td>\n",
1163
       "      <td>NaN</td>\n",
1164
       "    </tr>\n",
1165
       "    <tr>\n",
1166
       "      <th>29</th>\n",
1167
       "      <td>2018-10-20</td>\n",
1168
       "      <td>1.969945e-06</td>\n",
1169
       "      <td>1.431171e-06</td>\n",
1170
       "      <td>NaN</td>\n",
1171
       "      <td>0.000003</td>\n",
1172
       "      <td>2.750630e-06</td>\n",
1173
       "      <td>NaN</td>\n",
1174
       "      <td>0.000003</td>\n",
1175
       "      <td>6.083674e-06</td>\n",
1176
       "      <td>NaN</td>\n",
1177
       "      <td>...</td>\n",
1178
       "      <td>58.713717</td>\n",
1179
       "      <td>14.366667</td>\n",
1180
       "      <td>63.166668</td>\n",
1181
       "      <td>1034.099888</td>\n",
1182
       "      <td>NaN</td>\n",
1183
       "      <td>NaN</td>\n",
1184
       "      <td>NaN</td>\n",
1185
       "      <td>NaN</td>\n",
1186
       "      <td>NaN</td>\n",
1187
       "      <td>NaN</td>\n",
1188
       "    </tr>\n",
1189
       "    <tr>\n",
1190
       "      <th>30</th>\n",
1191
       "      <td>2018-10-21</td>\n",
1192
       "      <td>1.810997e-06</td>\n",
1193
       "      <td>1.365175e-06</td>\n",
1194
       "      <td>NaN</td>\n",
1195
       "      <td>0.000005</td>\n",
1196
       "      <td>2.487162e-06</td>\n",
1197
       "      <td>NaN</td>\n",
1198
       "      <td>0.000004</td>\n",
1199
       "      <td>6.123559e-06</td>\n",
1200
       "      <td>NaN</td>\n",
1201
       "      <td>...</td>\n",
1202
       "      <td>77.954818</td>\n",
1203
       "      <td>5.383333</td>\n",
1204
       "      <td>91.916664</td>\n",
1205
       "      <td>823.388241</td>\n",
1206
       "      <td>NaN</td>\n",
1207
       "      <td>NaN</td>\n",
1208
       "      <td>NaN</td>\n",
1209
       "      <td>NaN</td>\n",
1210
       "      <td>NaN</td>\n",
1211
       "      <td>NaN</td>\n",
1212
       "    </tr>\n",
1213
       "    <tr>\n",
1214
       "      <th>31</th>\n",
1215
       "      <td>2018-10-21</td>\n",
1216
       "      <td>-1.732660e-06</td>\n",
1217
       "      <td>-2.282520e-06</td>\n",
1218
       "      <td>NaN</td>\n",
1219
       "      <td>0.000004</td>\n",
1220
       "      <td>-2.034108e-06</td>\n",
1221
       "      <td>NaN</td>\n",
1222
       "      <td>0.000004</td>\n",
1223
       "      <td>-1.025116e-06</td>\n",
1224
       "      <td>NaN</td>\n",
1225
       "      <td>...</td>\n",
1226
       "      <td>60.671882</td>\n",
1227
       "      <td>15.341667</td>\n",
1228
       "      <td>62.250000</td>\n",
1229
       "      <td>1085.177392</td>\n",
1230
       "      <td>NaN</td>\n",
1231
       "      <td>NaN</td>\n",
1232
       "      <td>NaN</td>\n",
1233
       "      <td>NaN</td>\n",
1234
       "      <td>NaN</td>\n",
1235
       "      <td>NaN</td>\n",
1236
       "    </tr>\n",
1237
       "    <tr>\n",
1238
       "      <th>32</th>\n",
1239
       "      <td>2018-10-22</td>\n",
1240
       "      <td>-1.100335e-06</td>\n",
1241
       "      <td>-1.913171e-06</td>\n",
1242
       "      <td>NaN</td>\n",
1243
       "      <td>0.000005</td>\n",
1244
       "      <td>-1.609247e-06</td>\n",
1245
       "      <td>NaN</td>\n",
1246
       "      <td>0.000005</td>\n",
1247
       "      <td>2.947903e-07</td>\n",
1248
       "      <td>NaN</td>\n",
1249
       "      <td>...</td>\n",
1250
       "      <td>90.282846</td>\n",
1251
       "      <td>12.816667</td>\n",
1252
       "      <td>91.416664</td>\n",
1253
       "      <td>1352.931970</td>\n",
1254
       "      <td>NaN</td>\n",
1255
       "      <td>NaN</td>\n",
1256
       "      <td>NaN</td>\n",
1257
       "      <td>NaN</td>\n",
1258
       "      <td>NaN</td>\n",
1259
       "      <td>NaN</td>\n",
1260
       "    </tr>\n",
1261
       "    <tr>\n",
1262
       "      <th>33</th>\n",
1263
       "      <td>2018-10-22</td>\n",
1264
       "      <td>-5.490189e-07</td>\n",
1265
       "      <td>-9.766282e-07</td>\n",
1266
       "      <td>NaN</td>\n",
1267
       "      <td>0.000005</td>\n",
1268
       "      <td>-6.847724e-07</td>\n",
1269
       "      <td>NaN</td>\n",
1270
       "      <td>0.000005</td>\n",
1271
       "      <td>8.822850e-07</td>\n",
1272
       "      <td>NaN</td>\n",
1273
       "      <td>...</td>\n",
1274
       "      <td>51.921047</td>\n",
1275
       "      <td>14.325000</td>\n",
1276
       "      <td>59.000000</td>\n",
1277
       "      <td>963.286852</td>\n",
1278
       "      <td>NaN</td>\n",
1279
       "      <td>NaN</td>\n",
1280
       "      <td>NaN</td>\n",
1281
       "      <td>NaN</td>\n",
1282
       "      <td>NaN</td>\n",
1283
       "      <td>NaN</td>\n",
1284
       "    </tr>\n",
1285
       "    <tr>\n",
1286
       "      <th>34</th>\n",
1287
       "      <td>2018-10-24</td>\n",
1288
       "      <td>1.784753e-06</td>\n",
1289
       "      <td>1.555411e-06</td>\n",
1290
       "      <td>NaN</td>\n",
1291
       "      <td>0.000003</td>\n",
1292
       "      <td>2.193270e-06</td>\n",
1293
       "      <td>NaN</td>\n",
1294
       "      <td>0.000002</td>\n",
1295
       "      <td>4.541856e-06</td>\n",
1296
       "      <td>NaN</td>\n",
1297
       "      <td>...</td>\n",
1298
       "      <td>86.378121</td>\n",
1299
       "      <td>14.766666</td>\n",
1300
       "      <td>87.500000</td>\n",
1301
       "      <td>1469.951907</td>\n",
1302
       "      <td>NaN</td>\n",
1303
       "      <td>NaN</td>\n",
1304
       "      <td>NaN</td>\n",
1305
       "      <td>NaN</td>\n",
1306
       "      <td>NaN</td>\n",
1307
       "      <td>NaN</td>\n",
1308
       "    </tr>\n",
1309
       "    <tr>\n",
1310
       "      <th>35</th>\n",
1311
       "      <td>2018-10-24</td>\n",
1312
       "      <td>8.190939e-07</td>\n",
1313
       "      <td>5.508098e-07</td>\n",
1314
       "      <td>NaN</td>\n",
1315
       "      <td>0.000006</td>\n",
1316
       "      <td>1.043012e-06</td>\n",
1317
       "      <td>NaN</td>\n",
1318
       "      <td>0.000005</td>\n",
1319
       "      <td>4.216968e-06</td>\n",
1320
       "      <td>NaN</td>\n",
1321
       "      <td>...</td>\n",
1322
       "      <td>85.035832</td>\n",
1323
       "      <td>14.500000</td>\n",
1324
       "      <td>88.750000</td>\n",
1325
       "      <td>1465.504286</td>\n",
1326
       "      <td>NaN</td>\n",
1327
       "      <td>NaN</td>\n",
1328
       "      <td>NaN</td>\n",
1329
       "      <td>NaN</td>\n",
1330
       "      <td>NaN</td>\n",
1331
       "      <td>NaN</td>\n",
1332
       "    </tr>\n",
1333
       "    <tr>\n",
1334
       "      <th>36</th>\n",
1335
       "      <td>2018-10-25</td>\n",
1336
       "      <td>3.724496e-06</td>\n",
1337
       "      <td>3.241454e-06</td>\n",
1338
       "      <td>NaN</td>\n",
1339
       "      <td>0.000003</td>\n",
1340
       "      <td>4.705916e-06</td>\n",
1341
       "      <td>NaN</td>\n",
1342
       "      <td>0.000002</td>\n",
1343
       "      <td>8.929031e-06</td>\n",
1344
       "      <td>NaN</td>\n",
1345
       "      <td>...</td>\n",
1346
       "      <td>72.341495</td>\n",
1347
       "      <td>11.650001</td>\n",
1348
       "      <td>78.166664</td>\n",
1349
       "      <td>1071.325174</td>\n",
1350
       "      <td>NaN</td>\n",
1351
       "      <td>NaN</td>\n",
1352
       "      <td>NaN</td>\n",
1353
       "      <td>NaN</td>\n",
1354
       "      <td>NaN</td>\n",
1355
       "      <td>NaN</td>\n",
1356
       "    </tr>\n",
1357
       "    <tr>\n",
1358
       "      <th>37</th>\n",
1359
       "      <td>2018-10-25</td>\n",
1360
       "      <td>1.824806e-06</td>\n",
1361
       "      <td>1.196929e-06</td>\n",
1362
       "      <td>NaN</td>\n",
1363
       "      <td>0.000003</td>\n",
1364
       "      <td>2.209937e-06</td>\n",
1365
       "      <td>NaN</td>\n",
1366
       "      <td>0.000003</td>\n",
1367
       "      <td>5.299628e-06</td>\n",
1368
       "      <td>NaN</td>\n",
1369
       "      <td>...</td>\n",
1370
       "      <td>68.176070</td>\n",
1371
       "      <td>12.483334</td>\n",
1372
       "      <td>73.083336</td>\n",
1373
       "      <td>1058.211217</td>\n",
1374
       "      <td>NaN</td>\n",
1375
       "      <td>NaN</td>\n",
1376
       "      <td>NaN</td>\n",
1377
       "      <td>NaN</td>\n",
1378
       "      <td>NaN</td>\n",
1379
       "      <td>NaN</td>\n",
1380
       "    </tr>\n",
1381
       "    <tr>\n",
1382
       "      <th>38</th>\n",
1383
       "      <td>2018-10-26</td>\n",
1384
       "      <td>2.153363e-06</td>\n",
1385
       "      <td>2.132159e-06</td>\n",
1386
       "      <td>NaN</td>\n",
1387
       "      <td>0.000003</td>\n",
1388
       "      <td>2.389443e-06</td>\n",
1389
       "      <td>NaN</td>\n",
1390
       "      <td>0.000002</td>\n",
1391
       "      <td>4.990096e-06</td>\n",
1392
       "      <td>NaN</td>\n",
1393
       "      <td>...</td>\n",
1394
       "      <td>78.287534</td>\n",
1395
       "      <td>10.116667</td>\n",
1396
       "      <td>83.916664</td>\n",
1397
       "      <td>1038.558421</td>\n",
1398
       "      <td>NaN</td>\n",
1399
       "      <td>NaN</td>\n",
1400
       "      <td>NaN</td>\n",
1401
       "      <td>NaN</td>\n",
1402
       "      <td>NaN</td>\n",
1403
       "      <td>NaN</td>\n",
1404
       "    </tr>\n",
1405
       "    <tr>\n",
1406
       "      <th>39</th>\n",
1407
       "      <td>2018-10-26</td>\n",
1408
       "      <td>1.326535e-06</td>\n",
1409
       "      <td>7.106164e-07</td>\n",
1410
       "      <td>NaN</td>\n",
1411
       "      <td>0.000008</td>\n",
1412
       "      <td>8.805592e-07</td>\n",
1413
       "      <td>NaN</td>\n",
1414
       "      <td>0.000008</td>\n",
1415
       "      <td>3.677825e-06</td>\n",
1416
       "      <td>NaN</td>\n",
1417
       "      <td>...</td>\n",
1418
       "      <td>79.999436</td>\n",
1419
       "      <td>9.926667</td>\n",
1420
       "      <td>89.250000</td>\n",
1421
       "      <td>1090.588126</td>\n",
1422
       "      <td>1.235000</td>\n",
1423
       "      <td>0.000000</td>\n",
1424
       "      <td>0.056667</td>\n",
1425
       "      <td>1.1</td>\n",
1426
       "      <td>NaN</td>\n",
1427
       "      <td>NaN</td>\n",
1428
       "    </tr>\n",
1429
       "    <tr>\n",
1430
       "      <th>40</th>\n",
1431
       "      <td>2018-10-27</td>\n",
1432
       "      <td>3.636625e-06</td>\n",
1433
       "      <td>2.991667e-06</td>\n",
1434
       "      <td>NaN</td>\n",
1435
       "      <td>0.000005</td>\n",
1436
       "      <td>3.793937e-06</td>\n",
1437
       "      <td>NaN</td>\n",
1438
       "      <td>0.000004</td>\n",
1439
       "      <td>7.498736e-06</td>\n",
1440
       "      <td>NaN</td>\n",
1441
       "      <td>...</td>\n",
1442
       "      <td>85.339351</td>\n",
1443
       "      <td>5.366667</td>\n",
1444
       "      <td>94.416664</td>\n",
1445
       "      <td>844.802221</td>\n",
1446
       "      <td>61.010000</td>\n",
1447
       "      <td>56.300000</td>\n",
1448
       "      <td>13.606667</td>\n",
1449
       "      <td>0.0</td>\n",
1450
       "      <td>NaN</td>\n",
1451
       "      <td>NaN</td>\n",
1452
       "    </tr>\n",
1453
       "    <tr>\n",
1454
       "      <th>41</th>\n",
1455
       "      <td>2018-10-27</td>\n",
1456
       "      <td>-6.211330e-07</td>\n",
1457
       "      <td>-9.717194e-07</td>\n",
1458
       "      <td>NaN</td>\n",
1459
       "      <td>0.000004</td>\n",
1460
       "      <td>-9.310713e-07</td>\n",
1461
       "      <td>NaN</td>\n",
1462
       "      <td>0.000004</td>\n",
1463
       "      <td>6.339895e-07</td>\n",
1464
       "      <td>NaN</td>\n",
1465
       "      <td>...</td>\n",
1466
       "      <td>79.924031</td>\n",
1467
       "      <td>7.693333</td>\n",
1468
       "      <td>86.166664</td>\n",
1469
       "      <td>905.187480</td>\n",
1470
       "      <td>1.633333</td>\n",
1471
       "      <td>1.825000</td>\n",
1472
       "      <td>0.000000</td>\n",
1473
       "      <td>0.0</td>\n",
1474
       "      <td>NaN</td>\n",
1475
       "      <td>NaN</td>\n",
1476
       "    </tr>\n",
1477
       "    <tr>\n",
1478
       "      <th>42</th>\n",
1479
       "      <td>2018-10-28</td>\n",
1480
       "      <td>4.497817e-06</td>\n",
1481
       "      <td>4.283923e-06</td>\n",
1482
       "      <td>NaN</td>\n",
1483
       "      <td>0.000004</td>\n",
1484
       "      <td>4.852430e-06</td>\n",
1485
       "      <td>NaN</td>\n",
1486
       "      <td>0.000003</td>\n",
1487
       "      <td>8.562411e-06</td>\n",
1488
       "      <td>NaN</td>\n",
1489
       "      <td>...</td>\n",
1490
       "      <td>82.718420</td>\n",
1491
       "      <td>3.806667</td>\n",
1492
       "      <td>87.666664</td>\n",
1493
       "      <td>703.161433</td>\n",
1494
       "      <td>102.038333</td>\n",
1495
       "      <td>94.306667</td>\n",
1496
       "      <td>17.771667</td>\n",
1497
       "      <td>0.0</td>\n",
1498
       "      <td>NaN</td>\n",
1499
       "      <td>NaN</td>\n",
1500
       "    </tr>\n",
1501
       "    <tr>\n",
1502
       "      <th>43</th>\n",
1503
       "      <td>2018-10-28</td>\n",
1504
       "      <td>-1.333735e-06</td>\n",
1505
       "      <td>-1.513523e-06</td>\n",
1506
       "      <td>NaN</td>\n",
1507
       "      <td>0.000005</td>\n",
1508
       "      <td>-1.296741e-06</td>\n",
1509
       "      <td>NaN</td>\n",
1510
       "      <td>0.000004</td>\n",
1511
       "      <td>3.020331e-07</td>\n",
1512
       "      <td>NaN</td>\n",
1513
       "      <td>...</td>\n",
1514
       "      <td>64.977425</td>\n",
1515
       "      <td>5.376667</td>\n",
1516
       "      <td>75.416664</td>\n",
1517
       "      <td>675.267940</td>\n",
1518
       "      <td>0.015000</td>\n",
1519
       "      <td>0.015000</td>\n",
1520
       "      <td>0.366667</td>\n",
1521
       "      <td>0.0</td>\n",
1522
       "      <td>NaN</td>\n",
1523
       "      <td>NaN</td>\n",
1524
       "    </tr>\n",
1525
       "    <tr>\n",
1526
       "      <th>44</th>\n",
1527
       "      <td>2018-10-29</td>\n",
1528
       "      <td>-5.603311e-07</td>\n",
1529
       "      <td>-1.228439e-06</td>\n",
1530
       "      <td>NaN</td>\n",
1531
       "      <td>0.000006</td>\n",
1532
       "      <td>-1.040336e-06</td>\n",
1533
       "      <td>NaN</td>\n",
1534
       "      <td>0.000005</td>\n",
1535
       "      <td>9.589513e-07</td>\n",
1536
       "      <td>NaN</td>\n",
1537
       "      <td>...</td>\n",
1538
       "      <td>81.862039</td>\n",
1539
       "      <td>4.883333</td>\n",
1540
       "      <td>86.166664</td>\n",
1541
       "      <td>745.416323</td>\n",
1542
       "      <td>51.123333</td>\n",
1543
       "      <td>48.155000</td>\n",
1544
       "      <td>0.085000</td>\n",
1545
       "      <td>0.0</td>\n",
1546
       "      <td>NaN</td>\n",
1547
       "      <td>NaN</td>\n",
1548
       "    </tr>\n",
1549
       "    <tr>\n",
1550
       "      <th>45</th>\n",
1551
       "      <td>2018-10-29</td>\n",
1552
       "      <td>1.156162e-06</td>\n",
1553
       "      <td>7.338229e-07</td>\n",
1554
       "      <td>NaN</td>\n",
1555
       "      <td>0.000007</td>\n",
1556
       "      <td>6.615397e-07</td>\n",
1557
       "      <td>NaN</td>\n",
1558
       "      <td>0.000007</td>\n",
1559
       "      <td>3.020624e-06</td>\n",
1560
       "      <td>NaN</td>\n",
1561
       "      <td>...</td>\n",
1562
       "      <td>77.330572</td>\n",
1563
       "      <td>6.280000</td>\n",
1564
       "      <td>81.666664</td>\n",
1565
       "      <td>778.518557</td>\n",
1566
       "      <td>0.691667</td>\n",
1567
       "      <td>0.011667</td>\n",
1568
       "      <td>0.133333</td>\n",
1569
       "      <td>0.0</td>\n",
1570
       "      <td>NaN</td>\n",
1571
       "      <td>NaN</td>\n",
1572
       "    </tr>\n",
1573
       "    <tr>\n",
1574
       "      <th>46</th>\n",
1575
       "      <td>2018-10-30</td>\n",
1576
       "      <td>-5.832049e-07</td>\n",
1577
       "      <td>-1.367379e-06</td>\n",
1578
       "      <td>NaN</td>\n",
1579
       "      <td>0.000005</td>\n",
1580
       "      <td>-1.198896e-06</td>\n",
1581
       "      <td>NaN</td>\n",
1582
       "      <td>0.000005</td>\n",
1583
       "      <td>6.190209e-07</td>\n",
1584
       "      <td>NaN</td>\n",
1585
       "      <td>...</td>\n",
1586
       "      <td>90.119412</td>\n",
1587
       "      <td>4.605000</td>\n",
1588
       "      <td>93.416664</td>\n",
1589
       "      <td>792.542864</td>\n",
1590
       "      <td>89.415000</td>\n",
1591
       "      <td>83.198333</td>\n",
1592
       "      <td>0.101667</td>\n",
1593
       "      <td>0.0</td>\n",
1594
       "      <td>NaN</td>\n",
1595
       "      <td>NaN</td>\n",
1596
       "    </tr>\n",
1597
       "    <tr>\n",
1598
       "      <th>47</th>\n",
1599
       "      <td>2018-10-30</td>\n",
1600
       "      <td>6.831304e-07</td>\n",
1601
       "      <td>-1.583820e-07</td>\n",
1602
       "      <td>NaN</td>\n",
1603
       "      <td>0.000005</td>\n",
1604
       "      <td>1.502555e-08</td>\n",
1605
       "      <td>NaN</td>\n",
1606
       "      <td>0.000005</td>\n",
1607
       "      <td>1.761219e-06</td>\n",
1608
       "      <td>NaN</td>\n",
1609
       "      <td>...</td>\n",
1610
       "      <td>89.176624</td>\n",
1611
       "      <td>9.105000</td>\n",
1612
       "      <td>89.000000</td>\n",
1613
       "      <td>1029.029277</td>\n",
1614
       "      <td>1.580000</td>\n",
1615
       "      <td>0.000000</td>\n",
1616
       "      <td>0.031667</td>\n",
1617
       "      <td>0.0</td>\n",
1618
       "      <td>NaN</td>\n",
1619
       "      <td>NaN</td>\n",
1620
       "    </tr>\n",
1621
       "    <tr>\n",
1622
       "      <th>48</th>\n",
1623
       "      <td>2018-10-31</td>\n",
1624
       "      <td>-2.640546e-07</td>\n",
1625
       "      <td>-1.038990e-06</td>\n",
1626
       "      <td>NaN</td>\n",
1627
       "      <td>0.000005</td>\n",
1628
       "      <td>-1.141497e-06</td>\n",
1629
       "      <td>NaN</td>\n",
1630
       "      <td>0.000005</td>\n",
1631
       "      <td>7.637132e-07</td>\n",
1632
       "      <td>NaN</td>\n",
1633
       "      <td>...</td>\n",
1634
       "      <td>84.420349</td>\n",
1635
       "      <td>6.031667</td>\n",
1636
       "      <td>88.916664</td>\n",
1637
       "      <td>833.193491</td>\n",
1638
       "      <td>168.916667</td>\n",
1639
       "      <td>132.145000</td>\n",
1640
       "      <td>157.476667</td>\n",
1641
       "      <td>0.0</td>\n",
1642
       "      <td>NaN</td>\n",
1643
       "      <td>NaN</td>\n",
1644
       "    </tr>\n",
1645
       "    <tr>\n",
1646
       "      <th>49</th>\n",
1647
       "      <td>2018-10-31</td>\n",
1648
       "      <td>4.328737e-07</td>\n",
1649
       "      <td>-5.693961e-09</td>\n",
1650
       "      <td>NaN</td>\n",
1651
       "      <td>0.000006</td>\n",
1652
       "      <td>1.244246e-07</td>\n",
1653
       "      <td>NaN</td>\n",
1654
       "      <td>0.000006</td>\n",
1655
       "      <td>2.026151e-06</td>\n",
1656
       "      <td>NaN</td>\n",
1657
       "      <td>...</td>\n",
1658
       "      <td>82.939124</td>\n",
1659
       "      <td>10.496667</td>\n",
1660
       "      <td>88.500000</td>\n",
1661
       "      <td>1123.467763</td>\n",
1662
       "      <td>0.000000</td>\n",
1663
       "      <td>0.028333</td>\n",
1664
       "      <td>0.430000</td>\n",
1665
       "      <td>0.0</td>\n",
1666
       "      <td>NaN</td>\n",
1667
       "      <td>NaN</td>\n",
1668
       "    </tr>\n",
1669
       "  </tbody>\n",
1670
       "</table>\n",
1671
       "<p>50 rows × 28 columns</p>\n",
1672
       "</div>"
1673
      ],
1674
      "text/plain": [
1675
       "     timestamp      strain_1      strain_2  strain_3  strain_4      strain_5  \\\n",
1676
       "0   2018-10-02  1.804882e-06  1.291150e-06       NaN  0.000003           NaN   \n",
1677
       "1   2018-10-03  2.269802e-06  1.698958e-06       NaN  0.000004           NaN   \n",
1678
       "2   2018-10-03  2.128605e-06  1.411400e-06       NaN  0.000003           NaN   \n",
1679
       "3   2018-10-04  3.457613e-06  2.919155e-06       NaN  0.000004           NaN   \n",
1680
       "4   2018-10-04  1.420150e-07 -5.852899e-07       NaN  0.000005           NaN   \n",
1681
       "5   2018-10-05  1.282716e-06  2.430030e-07       NaN  0.000008           NaN   \n",
1682
       "6   2018-10-05 -3.599416e-07 -1.080711e-06       NaN  0.000005           NaN   \n",
1683
       "7   2018-10-06  3.045380e-06  2.472536e-06       NaN  0.000006           NaN   \n",
1684
       "8   2018-10-08 -4.537585e-07 -1.072013e-06       NaN  0.000006           NaN   \n",
1685
       "9   2018-10-08 -1.061381e-07 -7.471682e-07       NaN  0.000005           NaN   \n",
1686
       "10  2018-10-09  1.628155e-06  1.257122e-06       NaN  0.000004           NaN   \n",
1687
       "11  2018-10-09 -3.682028e-07 -1.007747e-06       NaN  0.000005           NaN   \n",
1688
       "12  2018-10-10 -4.486108e-07 -1.049204e-06       NaN  0.000005           NaN   \n",
1689
       "13  2018-10-10 -3.506244e-07 -9.312912e-07       NaN  0.000004 -8.837225e-07   \n",
1690
       "14  2018-10-11  9.078712e-08 -6.254588e-07       NaN  0.000007 -5.223130e-07   \n",
1691
       "15  2018-10-11 -5.495572e-07 -1.042136e-06       NaN  0.000005 -6.461451e-07   \n",
1692
       "16  2018-10-12  2.827529e-06  2.354601e-06       NaN  0.000004  3.245773e-06   \n",
1693
       "17  2018-10-12  1.409051e-06  8.248487e-07       NaN  0.000006  1.552718e-06   \n",
1694
       "18  2018-10-15  2.527285e-06  2.073035e-06       NaN  0.000002  2.815451e-06   \n",
1695
       "19  2018-10-15 -4.270678e-07 -1.003826e-06       NaN  0.000005 -6.829385e-07   \n",
1696
       "20  2018-10-16  1.935912e-06  1.531248e-06       NaN  0.000004  2.574173e-06   \n",
1697
       "21  2018-10-16 -3.912998e-07 -9.402715e-07       NaN  0.000005 -8.452086e-07   \n",
1698
       "22  2018-10-17  2.287292e-06  1.759895e-06       NaN  0.000004  2.737282e-06   \n",
1699
       "23  2018-10-17 -6.658138e-07 -1.174673e-06       NaN  0.000006 -9.838982e-07   \n",
1700
       "24  2018-10-18  1.756547e-06  1.209365e-06       NaN  0.000004  2.360669e-06   \n",
1701
       "25  2018-10-18  1.696276e-06  1.333564e-06       NaN  0.000003  2.450028e-06   \n",
1702
       "26  2018-10-19  2.643052e-06  2.049523e-06       NaN  0.000003  2.662817e-06   \n",
1703
       "27  2018-10-19 -1.319548e-07 -6.674203e-07       NaN  0.000005 -4.296196e-07   \n",
1704
       "28  2018-10-20 -1.332337e-06 -1.943410e-06       NaN  0.000006 -1.712419e-06   \n",
1705
       "29  2018-10-20  1.969945e-06  1.431171e-06       NaN  0.000003  2.750630e-06   \n",
1706
       "30  2018-10-21  1.810997e-06  1.365175e-06       NaN  0.000005  2.487162e-06   \n",
1707
       "31  2018-10-21 -1.732660e-06 -2.282520e-06       NaN  0.000004 -2.034108e-06   \n",
1708
       "32  2018-10-22 -1.100335e-06 -1.913171e-06       NaN  0.000005 -1.609247e-06   \n",
1709
       "33  2018-10-22 -5.490189e-07 -9.766282e-07       NaN  0.000005 -6.847724e-07   \n",
1710
       "34  2018-10-24  1.784753e-06  1.555411e-06       NaN  0.000003  2.193270e-06   \n",
1711
       "35  2018-10-24  8.190939e-07  5.508098e-07       NaN  0.000006  1.043012e-06   \n",
1712
       "36  2018-10-25  3.724496e-06  3.241454e-06       NaN  0.000003  4.705916e-06   \n",
1713
       "37  2018-10-25  1.824806e-06  1.196929e-06       NaN  0.000003  2.209937e-06   \n",
1714
       "38  2018-10-26  2.153363e-06  2.132159e-06       NaN  0.000003  2.389443e-06   \n",
1715
       "39  2018-10-26  1.326535e-06  7.106164e-07       NaN  0.000008  8.805592e-07   \n",
1716
       "40  2018-10-27  3.636625e-06  2.991667e-06       NaN  0.000005  3.793937e-06   \n",
1717
       "41  2018-10-27 -6.211330e-07 -9.717194e-07       NaN  0.000004 -9.310713e-07   \n",
1718
       "42  2018-10-28  4.497817e-06  4.283923e-06       NaN  0.000004  4.852430e-06   \n",
1719
       "43  2018-10-28 -1.333735e-06 -1.513523e-06       NaN  0.000005 -1.296741e-06   \n",
1720
       "44  2018-10-29 -5.603311e-07 -1.228439e-06       NaN  0.000006 -1.040336e-06   \n",
1721
       "45  2018-10-29  1.156162e-06  7.338229e-07       NaN  0.000007  6.615397e-07   \n",
1722
       "46  2018-10-30 -5.832049e-07 -1.367379e-06       NaN  0.000005 -1.198896e-06   \n",
1723
       "47  2018-10-30  6.831304e-07 -1.583820e-07       NaN  0.000005  1.502555e-08   \n",
1724
       "48  2018-10-31 -2.640546e-07 -1.038990e-06       NaN  0.000005 -1.141497e-06   \n",
1725
       "49  2018-10-31  4.328737e-07 -5.693961e-09       NaN  0.000006  1.244246e-07   \n",
1726
       "\n",
1727
       "    strain_6  strain_7      strain_8  strain_9  ...         Rh    airtemp  \\\n",
1728
       "0        NaN  0.000003  5.482034e-06       NaN  ...  71.280029  16.716667   \n",
1729
       "1        NaN  0.000003  5.813794e-06       NaN  ...  76.997064  12.141666   \n",
1730
       "2        NaN  0.000002  5.213818e-06       NaN  ...  55.975091  15.683333   \n",
1731
       "3        NaN  0.000004  8.611123e-06       NaN  ...  79.072215  12.958333   \n",
1732
       "4        NaN  0.000005  7.968894e-07       NaN  ...  58.432998  21.924999   \n",
1733
       "5        NaN  0.000007  4.326709e-06       NaN  ...  77.300284   9.525000   \n",
1734
       "6        NaN  0.000004  1.512664e-06       NaN  ...  47.062426  23.875000   \n",
1735
       "7        NaN  0.000005  6.635354e-06       NaN  ...  78.543308  11.433333   \n",
1736
       "8        NaN  0.000005  8.118908e-07       NaN  ...  73.230142   5.833333   \n",
1737
       "9        NaN  0.000005  6.869932e-07       NaN  ...  52.548953  15.975000   \n",
1738
       "10       NaN  0.000004  5.748393e-06       NaN  ...  77.955239   6.358333   \n",
1739
       "11       NaN  0.000005  5.841734e-07       NaN  ...  56.269163  18.052333   \n",
1740
       "12       NaN  0.000005  4.158732e-07       NaN  ...  81.122389   9.398639   \n",
1741
       "13       NaN  0.000004  5.287465e-07       NaN  ...  54.889717  23.548417   \n",
1742
       "14       NaN  0.000007  1.800594e-06       NaN  ...  72.342233  19.004861   \n",
1743
       "15       NaN  0.000005  8.852473e-07       NaN  ...  53.908886  24.208334   \n",
1744
       "16       NaN  0.000004  6.803631e-06       NaN  ...  83.950116  17.993750   \n",
1745
       "17       NaN  0.000006  5.098572e-06       NaN  ...  64.288978  23.465000   \n",
1746
       "18       NaN  0.000002  4.371978e-06       NaN  ...  59.638465  19.570000   \n",
1747
       "19       NaN  0.000005  7.821662e-07       NaN  ...  41.219275  22.181667   \n",
1748
       "20       NaN  0.000003  6.310965e-06       NaN  ...  71.332262  11.291667   \n",
1749
       "21       NaN  0.000005  8.549726e-07       NaN  ...  43.499465  22.855000   \n",
1750
       "22       NaN  0.000004  5.843397e-06       NaN  ...  75.164982  11.135000   \n",
1751
       "23       NaN  0.000005  8.058195e-07       NaN  ...  65.386193  18.858334   \n",
1752
       "24       NaN  0.000003  5.703489e-06       NaN  ...  84.501079  12.526667   \n",
1753
       "25       NaN  0.000003  5.655112e-06       NaN  ...  68.986611  15.483334   \n",
1754
       "26       NaN  0.000003  5.999171e-06       NaN  ...  78.343009  11.849999   \n",
1755
       "27       NaN  0.000005  1.068996e-06       NaN  ...  64.888729  15.866667   \n",
1756
       "28       NaN  0.000005  1.355707e-07       NaN  ...  75.949176   7.075000   \n",
1757
       "29       NaN  0.000003  6.083674e-06       NaN  ...  58.713717  14.366667   \n",
1758
       "30       NaN  0.000004  6.123559e-06       NaN  ...  77.954818   5.383333   \n",
1759
       "31       NaN  0.000004 -1.025116e-06       NaN  ...  60.671882  15.341667   \n",
1760
       "32       NaN  0.000005  2.947903e-07       NaN  ...  90.282846  12.816667   \n",
1761
       "33       NaN  0.000005  8.822850e-07       NaN  ...  51.921047  14.325000   \n",
1762
       "34       NaN  0.000002  4.541856e-06       NaN  ...  86.378121  14.766666   \n",
1763
       "35       NaN  0.000005  4.216968e-06       NaN  ...  85.035832  14.500000   \n",
1764
       "36       NaN  0.000002  8.929031e-06       NaN  ...  72.341495  11.650001   \n",
1765
       "37       NaN  0.000003  5.299628e-06       NaN  ...  68.176070  12.483334   \n",
1766
       "38       NaN  0.000002  4.990096e-06       NaN  ...  78.287534  10.116667   \n",
1767
       "39       NaN  0.000008  3.677825e-06       NaN  ...  79.999436   9.926667   \n",
1768
       "40       NaN  0.000004  7.498736e-06       NaN  ...  85.339351   5.366667   \n",
1769
       "41       NaN  0.000004  6.339895e-07       NaN  ...  79.924031   7.693333   \n",
1770
       "42       NaN  0.000003  8.562411e-06       NaN  ...  82.718420   3.806667   \n",
1771
       "43       NaN  0.000004  3.020331e-07       NaN  ...  64.977425   5.376667   \n",
1772
       "44       NaN  0.000005  9.589513e-07       NaN  ...  81.862039   4.883333   \n",
1773
       "45       NaN  0.000007  3.020624e-06       NaN  ...  77.330572   6.280000   \n",
1774
       "46       NaN  0.000005  6.190209e-07       NaN  ...  90.119412   4.605000   \n",
1775
       "47       NaN  0.000005  1.761219e-06       NaN  ...  89.176624   9.105000   \n",
1776
       "48       NaN  0.000005  7.637132e-07       NaN  ...  84.420349   6.031667   \n",
1777
       "49       NaN  0.000006  2.026151e-06       NaN  ...  82.939124  10.496667   \n",
1778
       "\n",
1779
       "        avgRh       avgVPr       avgGR       avgdR      avgdnr  totalrain  \\\n",
1780
       "0   74.500000  1417.871951         NaN         NaN         NaN        NaN   \n",
1781
       "1   79.166664  1120.819324         NaN         NaN         NaN        NaN   \n",
1782
       "2   61.250000  1091.387360         NaN         NaN         NaN        NaN   \n",
1783
       "3   83.083336  1241.060048         NaN         NaN         NaN        NaN   \n",
1784
       "4   54.500000  1433.934434         NaN         NaN         NaN        NaN   \n",
1785
       "5   92.833336  1104.173129         NaN         NaN         NaN        NaN   \n",
1786
       "6   45.583332  1349.343321         NaN         NaN         NaN        NaN   \n",
1787
       "7   90.500000  1222.699295         NaN         NaN         NaN        NaN   \n",
1788
       "8   91.916664   849.545823         NaN         NaN         NaN        NaN   \n",
1789
       "9   56.000000  1016.622559         NaN         NaN         NaN        NaN   \n",
1790
       "10  92.833336   889.771595         NaN         NaN         NaN        NaN   \n",
1791
       "11  57.583332  1192.356382   20.417556   18.671694   16.358833        0.0   \n",
1792
       "12  93.750000  1105.629785  157.019694   66.948917  407.837417        0.0   \n",
1793
       "13  56.416668  1637.594616   30.327806   16.180389   63.654694        0.0   \n",
1794
       "14  76.500000  1681.335790   31.314111   27.076306    0.377667        0.0   \n",
1795
       "15  55.916668  1688.607212         NaN         NaN         NaN        NaN   \n",
1796
       "16  89.166664  1839.557833  140.983056   78.890306  214.392639        0.0   \n",
1797
       "17  67.250000  1942.281645   30.878333   27.683333    9.416667        0.0   \n",
1798
       "18  63.250000  1439.851964   90.183333   85.575000    3.056667        0.0   \n",
1799
       "19  44.416668  1187.027705    9.636667   12.235000    0.311667        0.0   \n",
1800
       "20  86.583336  1158.849084  149.348333   65.840000  435.375000        0.0   \n",
1801
       "21  40.916668  1139.047585   22.431667   25.788333    0.680000        0.0   \n",
1802
       "22  90.833336  1203.156142  126.298333   78.948333  177.325000        0.0   \n",
1803
       "23  71.166664  1549.889447         NaN         NaN         NaN        NaN   \n",
1804
       "24  94.500000  1372.213888  104.860000   89.093333   50.601667        0.0   \n",
1805
       "25  76.583336  1347.232662         NaN         NaN         NaN        NaN   \n",
1806
       "26  86.750000  1204.783340         NaN         NaN         NaN        NaN   \n",
1807
       "27  72.000000  1298.070458         NaN         NaN         NaN        NaN   \n",
1808
       "28  95.500000   961.637716         NaN         NaN         NaN        NaN   \n",
1809
       "29  63.166668  1034.099888         NaN         NaN         NaN        NaN   \n",
1810
       "30  91.916664   823.388241         NaN         NaN         NaN        NaN   \n",
1811
       "31  62.250000  1085.177392         NaN         NaN         NaN        NaN   \n",
1812
       "32  91.416664  1352.931970         NaN         NaN         NaN        NaN   \n",
1813
       "33  59.000000   963.286852         NaN         NaN         NaN        NaN   \n",
1814
       "34  87.500000  1469.951907         NaN         NaN         NaN        NaN   \n",
1815
       "35  88.750000  1465.504286         NaN         NaN         NaN        NaN   \n",
1816
       "36  78.166664  1071.325174         NaN         NaN         NaN        NaN   \n",
1817
       "37  73.083336  1058.211217         NaN         NaN         NaN        NaN   \n",
1818
       "38  83.916664  1038.558421         NaN         NaN         NaN        NaN   \n",
1819
       "39  89.250000  1090.588126    1.235000    0.000000    0.056667        1.1   \n",
1820
       "40  94.416664   844.802221   61.010000   56.300000   13.606667        0.0   \n",
1821
       "41  86.166664   905.187480    1.633333    1.825000    0.000000        0.0   \n",
1822
       "42  87.666664   703.161433  102.038333   94.306667   17.771667        0.0   \n",
1823
       "43  75.416664   675.267940    0.015000    0.015000    0.366667        0.0   \n",
1824
       "44  86.166664   745.416323   51.123333   48.155000    0.085000        0.0   \n",
1825
       "45  81.666664   778.518557    0.691667    0.011667    0.133333        0.0   \n",
1826
       "46  93.416664   792.542864   89.415000   83.198333    0.101667        0.0   \n",
1827
       "47  89.000000  1029.029277    1.580000    0.000000    0.031667        0.0   \n",
1828
       "48  88.916664   833.193491  168.916667  132.145000  157.476667        0.0   \n",
1829
       "49  88.500000  1123.467763    0.000000    0.028333    0.430000        0.0   \n",
1830
       "\n",
1831
       "    avgws10  avgwd10  \n",
1832
       "0       NaN      NaN  \n",
1833
       "1       NaN      NaN  \n",
1834
       "2       NaN      NaN  \n",
1835
       "3       NaN      NaN  \n",
1836
       "4       NaN      NaN  \n",
1837
       "5       NaN      NaN  \n",
1838
       "6       NaN      NaN  \n",
1839
       "7       NaN      NaN  \n",
1840
       "8       NaN      NaN  \n",
1841
       "9       NaN      NaN  \n",
1842
       "10      NaN      NaN  \n",
1843
       "11      NaN      NaN  \n",
1844
       "12      NaN      NaN  \n",
1845
       "13      NaN      NaN  \n",
1846
       "14      NaN      NaN  \n",
1847
       "15      NaN      NaN  \n",
1848
       "16      NaN      NaN  \n",
1849
       "17      NaN      NaN  \n",
1850
       "18      NaN      NaN  \n",
1851
       "19      NaN      NaN  \n",
1852
       "20      NaN      NaN  \n",
1853
       "21      NaN      NaN  \n",
1854
       "22      NaN      NaN  \n",
1855
       "23      NaN      NaN  \n",
1856
       "24      NaN      NaN  \n",
1857
       "25      NaN      NaN  \n",
1858
       "26      NaN      NaN  \n",
1859
       "27      NaN      NaN  \n",
1860
       "28      NaN      NaN  \n",
1861
       "29      NaN      NaN  \n",
1862
       "30      NaN      NaN  \n",
1863
       "31      NaN      NaN  \n",
1864
       "32      NaN      NaN  \n",
1865
       "33      NaN      NaN  \n",
1866
       "34      NaN      NaN  \n",
1867
       "35      NaN      NaN  \n",
1868
       "36      NaN      NaN  \n",
1869
       "37      NaN      NaN  \n",
1870
       "38      NaN      NaN  \n",
1871
       "39      NaN      NaN  \n",
1872
       "40      NaN      NaN  \n",
1873
       "41      NaN      NaN  \n",
1874
       "42      NaN      NaN  \n",
1875
       "43      NaN      NaN  \n",
1876
       "44      NaN      NaN  \n",
1877
       "45      NaN      NaN  \n",
1878
       "46      NaN      NaN  \n",
1879
       "47      NaN      NaN  \n",
1880
       "48      NaN      NaN  \n",
1881
       "49      NaN      NaN  \n",
1882
       "\n",
1883
       "[50 rows x 28 columns]"
1884
      ]
1885
     },
1886
     "execution_count": 38,
1887
     "metadata": {},
1888
     "output_type": "execute_result"
1889
    }
1890
   ],
1891
   "source": [
1892
    "df1"
1893
   ]
1894
  },
1895
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ffd1ac20",
   "metadata": {},
   "outputs": [],
   "source": [
    "#looping to include all data in april month\n",
    "\n",
    "#names given to the 16 strain columns, in the order they appear in the strain matrix\n",
    "col_name = ['strain_' + str(i) for i in range(1, 17)]\n",
    "\n",
    "#names given to the environmental readings, listed in the order they are indexed in 'predat_env'\n",
    "env_col_name = [\n",
    "    'Surftemp',   #Surface temperature at one point below deck\n",
    "    'Rh',         #Relative humidity at one point below deck\n",
    "    'airtemp',    #Average air temperature\n",
    "    'avgRh',      #Average Relative Humidity\n",
    "    'avgVPr',     #Average Vapour Pressure\n",
    "    'avgGR',      #Average global Radiation\n",
    "    'avgdR',      #Average diffuse radiation\n",
    "    'avgdnr',     #Average Direct normal radiation\n",
    "    'totalrain',  #Total Rain\n",
    "    'avgws10',    #wind speed at 10m above ground\n",
    "    'avgwd10',    #wind direction at 10m above ground\n",
    "]\n",
    "\n",
    "#one day-wise frame per .mat file; they are concatenated once after the loop\n",
    "daily_frames = []\n",
    "for file_name in arr2:\n",
    "    mat = scipy.io.loadmat(os.path.join('./traindata_201904', file_name))\n",
    "    strain_struct = mat['predat_sg'][0][0]\n",
    "\n",
    "    #convert matlab time to a calendar date (719529 is the MATLAB datenum of 1970-01-01)\n",
    "    dates = [pd.to_datetime(item-719529, unit='d').round('s')[0].date()\n",
    "             for item in strain_struct[0]]\n",
    "\n",
    "    #create dataframe with the strain values and average them per calendar date\n",
    "    daily = pd.DataFrame(list(strain_struct[3]), columns=col_name)\n",
    "    daily.insert(0, 'timestamp', dates)\n",
    "    daily = daily.groupby(['timestamp']).mean()\n",
    "\n",
    "    #each environmental reading is a single value per file, broadcast to every row of that file\n",
    "    env_values = mat['predat_env'][0][0][-1][0]\n",
    "    for position, env_name in enumerate(env_col_name):\n",
    "        daily[env_name] = env_values[position]\n",
    "\n",
    "    daily_frames.append(daily)\n",
    "\n",
    "#DataFrame.append was removed in pandas 2.0; a single concat also avoids\n",
    "#re-copying the growing frame on every iteration\n",
    "strain_apr = pd.concat(daily_frames)\n",
    "\n",
    "#save the dataframe to CSV file\n",
    "strain_apr.to_csv('daywise_apr_with_env.csv')"
   ]
  },
1955
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5ca8e23c",
   "metadata": {},
   "outputs": [],
   "source": [
    "#run multivariate VAR\n",
    "\n",
    "\n",
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "%matplotlib inline\n",
    "import numpy as np\n",
    "from sklearn.metrics import mean_squared_error\n",
    "from statsmodels.tsa.vector_ar.vecm import coint_johansen\n",
    "from statsmodels.tsa.vector_ar.var_model import VAR\n",
    "\n",
    "#read the data\n",
    "#NOTE(review): the nested-list form of parse_dates is deprecated in recent pandas - confirm the installed version\n",
    "df = pd.read_csv(\"AirQualityUCI.csv\", parse_dates=[['Date', 'Time']])\n",
    "\n",
    "#the model works on `data`: the combined 'Date_Time' column becomes the index\n",
    "#so that only the measured series remain as columns\n",
    "#NOTE(review): assumes every remaining column is numeric - verify against the CSV\n",
    "data = df.set_index('Date_Time')\n",
    "cols = data.columns\n",
    "\n",
    "#missing value treatment: a reading of -200 is replaced by the previous reading\n",
    "#(back-fill only covers a series whose very first reading is -200)\n",
    "data = data.replace(-200, np.nan).ffill().bfill()\n",
    "\n",
    "#checking stationarity\n",
    "#since the test works for only 12 variables, one column is dropped here;\n",
    "#in the next iteration, I would drop another and check the eigenvalues\n",
    "johan_test_temp = data.drop([ 'CO(GT)'], axis=1)\n",
    "print(coint_johansen(johan_test_temp,-1,1).eig)\n",
    "\n",
    "#creating the train and validation set (first 80% / last 20%, order preserved)\n",
    "split_at = int(0.8*(len(data)))\n",
    "train = data[:split_at]\n",
    "valid = data[split_at:]\n",
    "\n",
    "#fit the model\n",
    "model = VAR(endog=train)\n",
    "model_fit = model.fit()\n",
    "\n",
    "# make prediction on validation\n",
    "#forecast() is seeded with the last k_ar training observations\n",
    "prediction = model_fit.forecast(train.values[-model_fit.k_ar:], steps=len(valid))\n",
    "\n",
    "#converting predictions to dataframe (one column per series, aligned with the validation rows)\n",
    "pred = pd.DataFrame(prediction, index=valid.index, columns=cols)\n",
    "\n",
    "#check rmse\n",
    "for i in cols:\n",
    "    print('rmse value for', i, 'is : ', np.sqrt(mean_squared_error(valid[i], pred[i])))\n",
    "\n",
    "#make final predictions\n",
    "model = VAR(endog=data)\n",
    "model_fit = model.fit()\n",
    "yhat = model_fit.forecast(data.values[-model_fit.k_ar:], steps=1)\n",
    "print(yhat)"
   ]
  },
2021
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "87347b7d",
   "metadata": {},
   "outputs": [],
   "source": [
    "#load the day-wise April (df1) and October (df2) CSV files\n",
    "df1, df2 = (pd.read_csv(csv_name) for csv_name in (\"daywise_apr.csv\", \"daywise_oct.csv\"))"
   ]
  },
2032
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "c454d88f",
   "metadata": {},
   "outputs": [],
   "source": [
    "#stack the October rows (df2) first, then the April rows (df1), with a fresh 0..n-1 index\n",
    "#(pd.concat replaces DataFrame.append, which was removed in pandas 2.0)\n",
    "df3 = pd.concat([df2, df1], ignore_index=True)"
   ]
  },
2042
  {
2043
   "cell_type": "code",
2044
   "execution_count": 22,
2045
   "id": "a51bb4ae",
2046
   "metadata": {},
2047
   "outputs": [
2048
    {
2049
     "data": {
2050
      "text/html": [
2051
       "<div>\n",
2052
       "<style scoped>\n",
2053
       "    .dataframe tbody tr th:only-of-type {\n",
2054
       "        vertical-align: middle;\n",
2055
       "    }\n",
2056
       "\n",
2057
       "    .dataframe tbody tr th {\n",
2058
       "        vertical-align: top;\n",
2059
       "    }\n",
2060
       "\n",
2061
       "    .dataframe thead th {\n",
2062
       "        text-align: right;\n",
2063
       "    }\n",
2064
       "</style>\n",
2065
       "<table border=\"1\" class=\"dataframe\">\n",
2066
       "  <thead>\n",
2067
       "    <tr style=\"text-align: right;\">\n",
2068
       "      <th></th>\n",
2069
       "      <th>timestamp</th>\n",
2070
       "      <th>strain_1</th>\n",
2071
       "      <th>strain_2</th>\n",
2072
       "      <th>strain_3</th>\n",
2073
       "      <th>strain_4</th>\n",
2074
       "      <th>strain_5</th>\n",
2075
       "      <th>strain_6</th>\n",
2076
       "      <th>strain_7</th>\n",
2077
       "      <th>strain_8</th>\n",
2078
       "      <th>strain_9</th>\n",
2079
       "      <th>strain_10</th>\n",
2080
       "      <th>strain_11</th>\n",
2081
       "      <th>strain_12</th>\n",
2082
       "      <th>strain_13</th>\n",
2083
       "      <th>strain_14</th>\n",
2084
       "      <th>strain_15</th>\n",
2085
       "      <th>strain_16</th>\n",
2086
       "    </tr>\n",
2087
       "  </thead>\n",
2088
       "  <tbody>\n",
2089
       "    <tr>\n",
2090
       "      <th>0</th>\n",
2091
       "      <td>2018-10-02</td>\n",
2092
       "      <td>1.804882e-06</td>\n",
2093
       "      <td>1.291150e-06</td>\n",
2094
       "      <td>NaN</td>\n",
2095
       "      <td>0.000003</td>\n",
2096
       "      <td>NaN</td>\n",
2097
       "      <td>NaN</td>\n",
2098
       "      <td>0.000003</td>\n",
2099
       "      <td>5.482034e-06</td>\n",
2100
       "      <td>NaN</td>\n",
2101
       "      <td>NaN</td>\n",
2102
       "      <td>NaN</td>\n",
2103
       "      <td>NaN</td>\n",
2104
       "      <td>NaN</td>\n",
2105
       "      <td>NaN</td>\n",
2106
       "      <td>NaN</td>\n",
2107
       "      <td>NaN</td>\n",
2108
       "    </tr>\n",
2109
       "    <tr>\n",
2110
       "      <th>1</th>\n",
2111
       "      <td>2018-10-03</td>\n",
2112
       "      <td>2.269802e-06</td>\n",
2113
       "      <td>1.698958e-06</td>\n",
2114
       "      <td>NaN</td>\n",
2115
       "      <td>0.000004</td>\n",
2116
       "      <td>NaN</td>\n",
2117
       "      <td>NaN</td>\n",
2118
       "      <td>0.000003</td>\n",
2119
       "      <td>5.813794e-06</td>\n",
2120
       "      <td>NaN</td>\n",
2121
       "      <td>NaN</td>\n",
2122
       "      <td>NaN</td>\n",
2123
       "      <td>NaN</td>\n",
2124
       "      <td>NaN</td>\n",
2125
       "      <td>NaN</td>\n",
2126
       "      <td>NaN</td>\n",
2127
       "      <td>NaN</td>\n",
2128
       "    </tr>\n",
2129
       "    <tr>\n",
2130
       "      <th>2</th>\n",
2131
       "      <td>2018-10-03</td>\n",
2132
       "      <td>2.128605e-06</td>\n",
2133
       "      <td>1.411400e-06</td>\n",
2134
       "      <td>NaN</td>\n",
2135
       "      <td>0.000003</td>\n",
2136
       "      <td>NaN</td>\n",
2137
       "      <td>NaN</td>\n",
2138
       "      <td>0.000002</td>\n",
2139
       "      <td>5.213818e-06</td>\n",
2140
       "      <td>NaN</td>\n",
2141
       "      <td>NaN</td>\n",
2142
       "      <td>NaN</td>\n",
2143
       "      <td>NaN</td>\n",
2144
       "      <td>NaN</td>\n",
2145
       "      <td>NaN</td>\n",
2146
       "      <td>NaN</td>\n",
2147
       "      <td>NaN</td>\n",
2148
       "    </tr>\n",
2149
       "    <tr>\n",
2150
       "      <th>3</th>\n",
2151
       "      <td>2018-10-04</td>\n",
2152
       "      <td>3.457613e-06</td>\n",
2153
       "      <td>2.919155e-06</td>\n",
2154
       "      <td>NaN</td>\n",
2155
       "      <td>0.000004</td>\n",
2156
       "      <td>NaN</td>\n",
2157
       "      <td>NaN</td>\n",
2158
       "      <td>0.000004</td>\n",
2159
       "      <td>8.611123e-06</td>\n",
2160
       "      <td>NaN</td>\n",
2161
       "      <td>NaN</td>\n",
2162
       "      <td>NaN</td>\n",
2163
       "      <td>NaN</td>\n",
2164
       "      <td>NaN</td>\n",
2165
       "      <td>NaN</td>\n",
2166
       "      <td>NaN</td>\n",
2167
       "      <td>NaN</td>\n",
2168
       "    </tr>\n",
2169
       "    <tr>\n",
2170
       "      <th>4</th>\n",
2171
       "      <td>2018-10-04</td>\n",
2172
       "      <td>1.420150e-07</td>\n",
2173
       "      <td>-5.852899e-07</td>\n",
2174
       "      <td>NaN</td>\n",
2175
       "      <td>0.000005</td>\n",
2176
       "      <td>NaN</td>\n",
2177
       "      <td>NaN</td>\n",
2178
       "      <td>0.000005</td>\n",
2179
       "      <td>7.968894e-07</td>\n",
2180
       "      <td>NaN</td>\n",
2181
       "      <td>NaN</td>\n",
2182
       "      <td>NaN</td>\n",
2183
       "      <td>NaN</td>\n",
2184
       "      <td>NaN</td>\n",
2185
       "      <td>NaN</td>\n",
2186
       "      <td>NaN</td>\n",
2187
       "      <td>NaN</td>\n",
2188
       "    </tr>\n",
2189
       "    <tr>\n",
2190
       "      <th>...</th>\n",
2191
       "      <td>...</td>\n",
2192
       "      <td>...</td>\n",
2193
       "      <td>...</td>\n",
2194
       "      <td>...</td>\n",
2195
       "      <td>...</td>\n",
2196
       "      <td>...</td>\n",
2197
       "      <td>...</td>\n",
2198
       "      <td>...</td>\n",
2199
       "      <td>...</td>\n",
2200
       "      <td>...</td>\n",
2201
       "      <td>...</td>\n",
2202
       "      <td>...</td>\n",
2203
       "      <td>...</td>\n",
2204
       "      <td>...</td>\n",
2205
       "      <td>...</td>\n",
2206
       "      <td>...</td>\n",
2207
       "      <td>...</td>\n",
2208
       "    </tr>\n",
2209
       "    <tr>\n",
2210
       "      <th>75</th>\n",
2211
       "      <td>2019-04-26</td>\n",
2212
       "      <td>-3.124659e-07</td>\n",
2213
       "      <td>-9.232934e-07</td>\n",
2214
       "      <td>-1.002870e-06</td>\n",
2215
       "      <td>0.000007</td>\n",
2216
       "      <td>-6.356581e-07</td>\n",
2217
       "      <td>-3.183168e-07</td>\n",
2218
       "      <td>0.000006</td>\n",
2219
       "      <td>1.193259e-06</td>\n",
2220
       "      <td>1.174737e-06</td>\n",
2221
       "      <td>1.245790e-06</td>\n",
2222
       "      <td>1.115366e-06</td>\n",
2223
       "      <td>1.164278e-06</td>\n",
2224
       "      <td>3.411089e-09</td>\n",
2225
       "      <td>1.196962e-07</td>\n",
2226
       "      <td>-3.273108e-07</td>\n",
2227
       "      <td>-1.667888e-06</td>\n",
2228
       "    </tr>\n",
2229
       "    <tr>\n",
2230
       "      <th>76</th>\n",
2231
       "      <td>2019-04-27</td>\n",
2232
       "      <td>2.549993e-07</td>\n",
2233
       "      <td>7.168742e-08</td>\n",
2234
       "      <td>-8.060298e-09</td>\n",
2235
       "      <td>0.000002</td>\n",
2236
       "      <td>5.027693e-08</td>\n",
2237
       "      <td>1.492946e-07</td>\n",
2238
       "      <td>0.000002</td>\n",
2239
       "      <td>6.433991e-07</td>\n",
2240
       "      <td>3.332187e-07</td>\n",
2241
       "      <td>3.612386e-07</td>\n",
2242
       "      <td>2.934336e-07</td>\n",
2243
       "      <td>3.209738e-07</td>\n",
2244
       "      <td>-3.559686e-08</td>\n",
2245
       "      <td>3.452330e-08</td>\n",
2246
       "      <td>-4.634966e-07</td>\n",
2247
       "      <td>-9.167307e-08</td>\n",
2248
       "    </tr>\n",
2249
       "    <tr>\n",
2250
       "      <th>77</th>\n",
2251
       "      <td>2019-04-28</td>\n",
2252
       "      <td>8.590041e-07</td>\n",
2253
       "      <td>6.393356e-07</td>\n",
2254
       "      <td>7.047048e-07</td>\n",
2255
       "      <td>0.000002</td>\n",
2256
       "      <td>1.048512e-06</td>\n",
2257
       "      <td>1.398638e-06</td>\n",
2258
       "      <td>0.000002</td>\n",
2259
       "      <td>2.602460e-06</td>\n",
2260
       "      <td>1.278090e-06</td>\n",
2261
       "      <td>1.505590e-06</td>\n",
2262
       "      <td>1.261098e-06</td>\n",
2263
       "      <td>1.437868e-06</td>\n",
2264
       "      <td>2.817936e-07</td>\n",
2265
       "      <td>6.031811e-08</td>\n",
2266
       "      <td>-1.552841e-07</td>\n",
2267
       "      <td>2.520299e-07</td>\n",
2268
       "    </tr>\n",
2269
       "    <tr>\n",
2270
       "      <th>78</th>\n",
2271
       "      <td>2019-04-29</td>\n",
2272
       "      <td>1.962889e-06</td>\n",
2273
       "      <td>1.290465e-06</td>\n",
2274
       "      <td>1.197580e-06</td>\n",
2275
       "      <td>0.000004</td>\n",
2276
       "      <td>1.593252e-06</td>\n",
2277
       "      <td>2.089498e-06</td>\n",
2278
       "      <td>0.000004</td>\n",
2279
       "      <td>3.852848e-06</td>\n",
2280
       "      <td>2.024704e-06</td>\n",
2281
       "      <td>2.109126e-06</td>\n",
2282
       "      <td>1.913340e-06</td>\n",
2283
       "      <td>2.073502e-06</td>\n",
2284
       "      <td>4.534765e-07</td>\n",
2285
       "      <td>6.241088e-08</td>\n",
2286
       "      <td>9.231739e-07</td>\n",
2287
       "      <td>-5.676041e-07</td>\n",
2288
       "    </tr>\n",
2289
       "    <tr>\n",
2290
       "      <th>79</th>\n",
2291
       "      <td>2019-04-30</td>\n",
2292
       "      <td>5.546739e-07</td>\n",
2293
       "      <td>3.677712e-08</td>\n",
2294
       "      <td>-2.769599e-08</td>\n",
2295
       "      <td>0.000004</td>\n",
2296
       "      <td>4.224754e-07</td>\n",
2297
       "      <td>9.494376e-07</td>\n",
2298
       "      <td>0.000004</td>\n",
2299
       "      <td>2.824605e-06</td>\n",
2300
       "      <td>1.739321e-06</td>\n",
2301
       "      <td>2.144481e-06</td>\n",
2302
       "      <td>1.680042e-06</td>\n",
2303
       "      <td>2.033107e-06</td>\n",
2304
       "      <td>7.093554e-07</td>\n",
2305
       "      <td>5.049996e-07</td>\n",
2306
       "      <td>-2.126916e-07</td>\n",
2307
       "      <td>2.013945e-07</td>\n",
2308
       "    </tr>\n",
2309
       "  </tbody>\n",
2310
       "</table>\n",
2311
       "<p>80 rows × 17 columns</p>\n",
2312
       "</div>"
2313
      ],
2314
      "text/plain": [
2315
       "     timestamp      strain_1      strain_2      strain_3  strain_4  \\\n",
2316
       "0   2018-10-02  1.804882e-06  1.291150e-06           NaN  0.000003   \n",
2317
       "1   2018-10-03  2.269802e-06  1.698958e-06           NaN  0.000004   \n",
2318
       "2   2018-10-03  2.128605e-06  1.411400e-06           NaN  0.000003   \n",
2319
       "3   2018-10-04  3.457613e-06  2.919155e-06           NaN  0.000004   \n",
2320
       "4   2018-10-04  1.420150e-07 -5.852899e-07           NaN  0.000005   \n",
2321
       "..         ...           ...           ...           ...       ...   \n",
2322
       "75  2019-04-26 -3.124659e-07 -9.232934e-07 -1.002870e-06  0.000007   \n",
2323
       "76  2019-04-27  2.549993e-07  7.168742e-08 -8.060298e-09  0.000002   \n",
2324
       "77  2019-04-28  8.590041e-07  6.393356e-07  7.047048e-07  0.000002   \n",
2325
       "78  2019-04-29  1.962889e-06  1.290465e-06  1.197580e-06  0.000004   \n",
2326
       "79  2019-04-30  5.546739e-07  3.677712e-08 -2.769599e-08  0.000004   \n",
2327
       "\n",
2328
       "        strain_5      strain_6  strain_7      strain_8      strain_9  \\\n",
2329
       "0            NaN           NaN  0.000003  5.482034e-06           NaN   \n",
2330
       "1            NaN           NaN  0.000003  5.813794e-06           NaN   \n",
2331
       "2            NaN           NaN  0.000002  5.213818e-06           NaN   \n",
2332
       "3            NaN           NaN  0.000004  8.611123e-06           NaN   \n",
2333
       "4            NaN           NaN  0.000005  7.968894e-07           NaN   \n",
2334
       "..           ...           ...       ...           ...           ...   \n",
2335
       "75 -6.356581e-07 -3.183168e-07  0.000006  1.193259e-06  1.174737e-06   \n",
2336
       "76  5.027693e-08  1.492946e-07  0.000002  6.433991e-07  3.332187e-07   \n",
2337
       "77  1.048512e-06  1.398638e-06  0.000002  2.602460e-06  1.278090e-06   \n",
2338
       "78  1.593252e-06  2.089498e-06  0.000004  3.852848e-06  2.024704e-06   \n",
2339
       "79  4.224754e-07  9.494376e-07  0.000004  2.824605e-06  1.739321e-06   \n",
2340
       "\n",
2341
       "       strain_10     strain_11     strain_12     strain_13     strain_14  \\\n",
2342
       "0            NaN           NaN           NaN           NaN           NaN   \n",
2343
       "1            NaN           NaN           NaN           NaN           NaN   \n",
2344
       "2            NaN           NaN           NaN           NaN           NaN   \n",
2345
       "3            NaN           NaN           NaN           NaN           NaN   \n",
2346
       "4            NaN           NaN           NaN           NaN           NaN   \n",
2347
       "..           ...           ...           ...           ...           ...   \n",
2348
       "75  1.245790e-06  1.115366e-06  1.164278e-06  3.411089e-09  1.196962e-07   \n",
2349
       "76  3.612386e-07  2.934336e-07  3.209738e-07 -3.559686e-08  3.452330e-08   \n",
2350
       "77  1.505590e-06  1.261098e-06  1.437868e-06  2.817936e-07  6.031811e-08   \n",
2351
       "78  2.109126e-06  1.913340e-06  2.073502e-06  4.534765e-07  6.241088e-08   \n",
2352
       "79  2.144481e-06  1.680042e-06  2.033107e-06  7.093554e-07  5.049996e-07   \n",
2353
       "\n",
2354
       "       strain_15     strain_16  \n",
2355
       "0            NaN           NaN  \n",
2356
       "1            NaN           NaN  \n",
2357
       "2            NaN           NaN  \n",
2358
       "3            NaN           NaN  \n",
2359
       "4            NaN           NaN  \n",
2360
       "..           ...           ...  \n",
2361
       "75 -3.273108e-07 -1.667888e-06  \n",
2362
       "76 -4.634966e-07 -9.167307e-08  \n",
2363
       "77 -1.552841e-07  2.520299e-07  \n",
2364
       "78  9.231739e-07 -5.676041e-07  \n",
2365
       "79 -2.126916e-07  2.013945e-07  \n",
2366
       "\n",
2367
       "[80 rows x 17 columns]"
2368
      ]
2369
     },
2370
     "execution_count": 22,
2371
     "metadata": {},
2372
     "output_type": "execute_result"
2373
    }
2374
   ],
2375
   "source": [
2376
    "df3"
2377
   ]
2378
  },
2379
  {
2380
   "cell_type": "code",
2381
   "execution_count": 19,
2382
   "id": "d58c2f0b",
2383
   "metadata": {},
2384
   "outputs": [],
2385
   "source": [
2386
    "df1 = df1.groupby('timestamp', as_index=False).mean()  # one averaged row per timestamp; timestamp stays a column"
2387
   ]
2388
  },
2389
  {
2390
   "cell_type": "code",
2391
   "execution_count": 23,
2392
   "id": "301e9de3",
2393
   "metadata": {},
2394
   "outputs": [],
2395
   "source": [
2396
    "df2 = df2.groupby('timestamp', as_index=False).mean()  # one averaged row per timestamp; timestamp stays a column"
2397
   ]
2398
  },
2399
  {
2400
   "cell_type": "code",
2401
   "execution_count": 26,
2402
   "id": "432c1f8b",
2403
   "metadata": {},
2404
   "outputs": [],
2405
   "source": [
2406
    "df5 = pd.read_csv('daywise_oct_with_env.csv')"
2407
   ]
2408
  },
2409
  {
2410
   "cell_type": "code",
2411
   "execution_count": 57,
2412
   "id": "8677b9f8",
2413
   "metadata": {},
2414
   "outputs": [],
2415
   "source": [
2416
    "strain_apr.to_csv('daywise_apr_with_env.csv')\n"
2417
   ]
2418
  },
2419
  {
2420
   "cell_type": "code",
2421
   "execution_count": 2,
2422
   "id": "7a66e87b",
2423
   "metadata": {},
2424
   "outputs": [],
2425
   "source": [
2426
    "dfa = pd.read_csv(\"daywise_apr_with_env.csv\")\n",
2427
    "dfo = pd.read_csv(\"daywise_oct_with_env2_final.csv\")"
2428
   ]
2429
  },
2430
  {
2431
   "cell_type": "code",
2432
   "execution_count": 3,
2433
   "id": "bf0a430f",
2434
   "metadata": {},
2435
   "outputs": [],
2436
   "source": [
2437
    "# Average rows that share a timestamp (timestamp becomes the index), then tag each frame: retrofit=0 for dfa, 1 for dfo.\n",
    "dfa = dfa.groupby('timestamp').mean().assign(retrofit=0)\n",
    "dfo = dfo.groupby('timestamp').mean().assign(retrofit=1)"
2441
   ]
2442
  },
2443
  {
2444
   "cell_type": "code",
2445
   "execution_count": 4,
2446
   "id": "6def4f62",
2447
   "metadata": {},
2448
   "outputs": [],
2449
   "source": [
2450
    "dfall = pd.concat([dfa, dfo])  # stack dfa rows then dfo rows, indexes kept; DataFrame.append was removed in pandas 2.0"
2451
   ]
2452
  },
2453
  {
2454
   "cell_type": "code",
2455
   "execution_count": 5,
2456
   "id": "e1a1a671",
2457
   "metadata": {},
2458
   "outputs": [],
2459
   "source": [
2460
    "#dfall = dfall.reset_index()"
2461
   ]
2462
  },
2463
  {
2464
   "cell_type": "code",
2465
   "execution_count": 6,
2466
   "id": "0385d72f",
2467
   "metadata": {},
2468
   "outputs": [],
2469
   "source": [
2470
    "# Remove the strain columns that are not used further down (strain_1/2/3/5/8 are the ones kept).\n",
    "dropped_gauges = [\"strain_4\",\"strain_6\",\"strain_7\",\"strain_9\",\"strain_10\",\"strain_11\",\"strain_12\",\"strain_13\",\"strain_14\",\"strain_15\",\"strain_16\"]\n",
    "dfall = dfall.drop(columns=dropped_gauges)"
2471
   ]
2472
  },
2473
  {
2474
   "cell_type": "code",
2475
   "execution_count": 7,
2476
   "id": "989b96db",
2477
   "metadata": {},
2478
   "outputs": [
2479
    {
2480
     "data": {
2481
      "text/html": [
2482
       "<div>\n",
2483
       "<style scoped>\n",
2484
       "    .dataframe tbody tr th:only-of-type {\n",
2485
       "        vertical-align: middle;\n",
2486
       "    }\n",
2487
       "\n",
2488
       "    .dataframe tbody tr th {\n",
2489
       "        vertical-align: top;\n",
2490
       "    }\n",
2491
       "\n",
2492
       "    .dataframe thead th {\n",
2493
       "        text-align: right;\n",
2494
       "    }\n",
2495
       "</style>\n",
2496
       "<table border=\"1\" class=\"dataframe\">\n",
2497
       "  <thead>\n",
2498
       "    <tr style=\"text-align: right;\">\n",
2499
       "      <th></th>\n",
2500
       "      <th>strain_1</th>\n",
2501
       "      <th>strain_2</th>\n",
2502
       "      <th>strain_3</th>\n",
2503
       "      <th>strain_5</th>\n",
2504
       "      <th>strain_8</th>\n",
2505
       "      <th>Surftemp</th>\n",
2506
       "      <th>Rh</th>\n",
2507
       "      <th>airtemp</th>\n",
2508
       "      <th>avgRh</th>\n",
2509
       "      <th>avgVPr</th>\n",
2510
       "      <th>avgGR</th>\n",
2511
       "      <th>avgdR</th>\n",
2512
       "      <th>avgdnr</th>\n",
2513
       "      <th>totalrain</th>\n",
2514
       "      <th>avgws10</th>\n",
2515
       "      <th>avgwd10</th>\n",
2516
       "      <th>retrofit</th>\n",
2517
       "    </tr>\n",
2518
       "    <tr>\n",
2519
       "      <th>timestamp</th>\n",
2520
       "      <th></th>\n",
2521
       "      <th></th>\n",
2522
       "      <th></th>\n",
2523
       "      <th></th>\n",
2524
       "      <th></th>\n",
2525
       "      <th></th>\n",
2526
       "      <th></th>\n",
2527
       "      <th></th>\n",
2528
       "      <th></th>\n",
2529
       "      <th></th>\n",
2530
       "      <th></th>\n",
2531
       "      <th></th>\n",
2532
       "      <th></th>\n",
2533
       "      <th></th>\n",
2534
       "      <th></th>\n",
2535
       "      <th></th>\n",
2536
       "      <th></th>\n",
2537
       "    </tr>\n",
2538
       "  </thead>\n",
2539
       "  <tbody>\n",
2540
       "    <tr>\n",
2541
       "      <th>2019-04-01</th>\n",
2542
       "      <td>1.391124e-06</td>\n",
2543
       "      <td>9.055422e-07</td>\n",
2544
       "      <td>7.714158e-07</td>\n",
2545
       "      <td>9.654413e-07</td>\n",
2546
       "      <td>2.746018e-06</td>\n",
2547
       "      <td>11.802222</td>\n",
2548
       "      <td>51.495514</td>\n",
2549
       "      <td>11.349167</td>\n",
2550
       "      <td>56.125002</td>\n",
2551
       "      <td>708.982498</td>\n",
2552
       "      <td>233.389167</td>\n",
2553
       "      <td>87.455833</td>\n",
2554
       "      <td>478.697500</td>\n",
2555
       "      <td>0.00</td>\n",
2556
       "      <td>3.335575</td>\n",
2557
       "      <td>37.478949</td>\n",
2558
       "      <td>0</td>\n",
2559
       "    </tr>\n",
2560
       "    <tr>\n",
2561
       "      <th>2019-04-02</th>\n",
2562
       "      <td>1.902302e-06</td>\n",
2563
       "      <td>1.393590e-06</td>\n",
2564
       "      <td>1.346971e-06</td>\n",
2565
       "      <td>1.786195e-06</td>\n",
2566
       "      <td>4.467735e-06</td>\n",
2567
       "      <td>11.776378</td>\n",
2568
       "      <td>72.111068</td>\n",
2569
       "      <td>10.497500</td>\n",
2570
       "      <td>77.708336</td>\n",
2571
       "      <td>985.274874</td>\n",
2572
       "      <td>87.955000</td>\n",
2573
       "      <td>83.221667</td>\n",
2574
       "      <td>2.445000</td>\n",
2575
       "      <td>0.05</td>\n",
2576
       "      <td>1.135126</td>\n",
2577
       "      <td>209.014923</td>\n",
2578
       "      <td>0</td>\n",
2579
       "    </tr>\n",
2580
       "    <tr>\n",
2581
       "      <th>2019-04-03</th>\n",
2582
       "      <td>7.411497e-07</td>\n",
2583
       "      <td>1.109817e-07</td>\n",
2584
       "      <td>7.233085e-08</td>\n",
2585
       "      <td>6.347549e-07</td>\n",
2586
       "      <td>3.083803e-06</td>\n",
2587
       "      <td>8.487706</td>\n",
2588
       "      <td>69.587566</td>\n",
2589
       "      <td>8.279167</td>\n",
2590
       "      <td>72.916666</td>\n",
2591
       "      <td>790.862084</td>\n",
2592
       "      <td>116.270833</td>\n",
2593
       "      <td>107.811667</td>\n",
2594
       "      <td>21.199167</td>\n",
2595
       "      <td>0.00</td>\n",
2596
       "      <td>1.599006</td>\n",
2597
       "      <td>141.619137</td>\n",
2598
       "      <td>0</td>\n",
2599
       "    </tr>\n",
2600
       "    <tr>\n",
2601
       "      <th>2019-04-04</th>\n",
2602
       "      <td>4.070716e-07</td>\n",
2603
       "      <td>-9.959862e-08</td>\n",
2604
       "      <td>-1.797842e-07</td>\n",
2605
       "      <td>-1.076326e-08</td>\n",
2606
       "      <td>1.905123e-06</td>\n",
2607
       "      <td>7.694840</td>\n",
2608
       "      <td>71.085618</td>\n",
2609
       "      <td>7.617500</td>\n",
2610
       "      <td>72.458332</td>\n",
2611
       "      <td>738.126551</td>\n",
2612
       "      <td>160.467500</td>\n",
2613
       "      <td>128.485000</td>\n",
2614
       "      <td>112.169167</td>\n",
2615
       "      <td>0.00</td>\n",
2616
       "      <td>1.181543</td>\n",
2617
       "      <td>178.318237</td>\n",
2618
       "      <td>0</td>\n",
2619
       "    </tr>\n",
2620
       "    <tr>\n",
2621
       "      <th>2019-04-05</th>\n",
2622
       "      <td>2.359754e-06</td>\n",
2623
       "      <td>1.851080e-06</td>\n",
2624
       "      <td>1.895205e-06</td>\n",
2625
       "      <td>2.641687e-06</td>\n",
2626
       "      <td>5.894953e-06</td>\n",
2627
       "      <td>9.097269</td>\n",
2628
       "      <td>66.807711</td>\n",
2629
       "      <td>9.810000</td>\n",
2630
       "      <td>71.999998</td>\n",
2631
       "      <td>846.904428</td>\n",
2632
       "      <td>225.915833</td>\n",
2633
       "      <td>94.376667</td>\n",
2634
       "      <td>376.993333</td>\n",
2635
       "      <td>0.00</td>\n",
2636
       "      <td>2.706478</td>\n",
2637
       "      <td>30.143506</td>\n",
2638
       "      <td>0</td>\n",
2639
       "    </tr>\n",
2640
       "    <tr>\n",
2641
       "      <th>...</th>\n",
2642
       "      <td>...</td>\n",
2643
       "      <td>...</td>\n",
2644
       "      <td>...</td>\n",
2645
       "      <td>...</td>\n",
2646
       "      <td>...</td>\n",
2647
       "      <td>...</td>\n",
2648
       "      <td>...</td>\n",
2649
       "      <td>...</td>\n",
2650
       "      <td>...</td>\n",
2651
       "      <td>...</td>\n",
2652
       "      <td>...</td>\n",
2653
       "      <td>...</td>\n",
2654
       "      <td>...</td>\n",
2655
       "      <td>...</td>\n",
2656
       "      <td>...</td>\n",
2657
       "      <td>...</td>\n",
2658
       "      <td>...</td>\n",
2659
       "    </tr>\n",
2660
       "    <tr>\n",
2661
       "      <th>2019-10-27</th>\n",
2662
       "      <td>-5.999584e-07</td>\n",
2663
       "      <td>-6.906911e-07</td>\n",
2664
       "      <td>-6.094068e-07</td>\n",
2665
       "      <td>-4.732139e-07</td>\n",
2666
       "      <td>1.166937e-07</td>\n",
2667
       "      <td>11.353086</td>\n",
2668
       "      <td>74.968842</td>\n",
2669
       "      <td>8.625833</td>\n",
2670
       "      <td>86.211667</td>\n",
2671
       "      <td>963.436168</td>\n",
2672
       "      <td>50.277500</td>\n",
2673
       "      <td>45.353333</td>\n",
2674
       "      <td>0.026667</td>\n",
2675
       "      <td>0.00</td>\n",
2676
       "      <td>0.675000</td>\n",
2677
       "      <td>212.700000</td>\n",
2678
       "      <td>1</td>\n",
2679
       "    </tr>\n",
2680
       "    <tr>\n",
2681
       "      <th>2019-10-28</th>\n",
2682
       "      <td>1.397000e-06</td>\n",
2683
       "      <td>9.859024e-07</td>\n",
2684
       "      <td>1.066181e-06</td>\n",
2685
       "      <td>2.024451e-06</td>\n",
2686
       "      <td>5.393001e-06</td>\n",
2687
       "      <td>9.467404</td>\n",
2688
       "      <td>80.369227</td>\n",
2689
       "      <td>6.798333</td>\n",
2690
       "      <td>90.648333</td>\n",
2691
       "      <td>895.893447</td>\n",
2692
       "      <td>95.483333</td>\n",
2693
       "      <td>30.701667</td>\n",
2694
       "      <td>225.355000</td>\n",
2695
       "      <td>0.00</td>\n",
2696
       "      <td>0.570000</td>\n",
2697
       "      <td>185.550000</td>\n",
2698
       "      <td>1</td>\n",
2699
       "    </tr>\n",
2700
       "    <tr>\n",
2701
       "      <th>2019-10-29</th>\n",
2702
       "      <td>-6.309372e-07</td>\n",
2703
       "      <td>-1.042560e-06</td>\n",
2704
       "      <td>-1.056013e-06</td>\n",
2705
       "      <td>-6.259414e-07</td>\n",
2706
       "      <td>1.546657e-06</td>\n",
2707
       "      <td>9.921486</td>\n",
2708
       "      <td>76.104669</td>\n",
2709
       "      <td>8.613333</td>\n",
2710
       "      <td>74.891667</td>\n",
2711
       "      <td>833.864494</td>\n",
2712
       "      <td>61.040000</td>\n",
2713
       "      <td>42.480833</td>\n",
2714
       "      <td>51.544167</td>\n",
2715
       "      <td>0.00</td>\n",
2716
       "      <td>1.270000</td>\n",
2717
       "      <td>36.745000</td>\n",
2718
       "      <td>1</td>\n",
2719
       "    </tr>\n",
2720
       "    <tr>\n",
2721
       "      <th>2019-10-30</th>\n",
2722
       "      <td>9.535004e-07</td>\n",
2723
       "      <td>6.590445e-07</td>\n",
2724
       "      <td>7.793678e-07</td>\n",
2725
       "      <td>1.486794e-06</td>\n",
2726
       "      <td>4.421555e-06</td>\n",
2727
       "      <td>7.566899</td>\n",
2728
       "      <td>77.632557</td>\n",
2729
       "      <td>6.325000</td>\n",
2730
       "      <td>78.035833</td>\n",
2731
       "      <td>745.242319</td>\n",
2732
       "      <td>32.364167</td>\n",
2733
       "      <td>29.780833</td>\n",
2734
       "      <td>0.000000</td>\n",
2735
       "      <td>0.00</td>\n",
2736
       "      <td>2.005000</td>\n",
2737
       "      <td>44.650000</td>\n",
2738
       "      <td>1</td>\n",
2739
       "    </tr>\n",
2740
       "    <tr>\n",
2741
       "      <th>2019-10-31</th>\n",
2742
       "      <td>9.887800e-07</td>\n",
2743
       "      <td>6.287566e-07</td>\n",
2744
       "      <td>7.288098e-07</td>\n",
2745
       "      <td>1.418339e-06</td>\n",
2746
       "      <td>4.201527e-06</td>\n",
2747
       "      <td>6.945136</td>\n",
2748
       "      <td>76.931039</td>\n",
2749
       "      <td>5.306667</td>\n",
2750
       "      <td>81.060000</td>\n",
2751
       "      <td>723.901020</td>\n",
2752
       "      <td>93.960000</td>\n",
2753
       "      <td>49.780000</td>\n",
2754
       "      <td>170.127500</td>\n",
2755
       "      <td>0.00</td>\n",
2756
       "      <td>1.125000</td>\n",
2757
       "      <td>53.745000</td>\n",
2758
       "      <td>1</td>\n",
2759
       "    </tr>\n",
2760
       "  </tbody>\n",
2761
       "</table>\n",
2762
       "<p>61 rows × 17 columns</p>\n",
2763
       "</div>"
2764
      ],
2765
      "text/plain": [
2766
       "                strain_1      strain_2      strain_3      strain_5  \\\n",
2767
       "timestamp                                                            \n",
2768
       "2019-04-01  1.391124e-06  9.055422e-07  7.714158e-07  9.654413e-07   \n",
2769
       "2019-04-02  1.902302e-06  1.393590e-06  1.346971e-06  1.786195e-06   \n",
2770
       "2019-04-03  7.411497e-07  1.109817e-07  7.233085e-08  6.347549e-07   \n",
2771
       "2019-04-04  4.070716e-07 -9.959862e-08 -1.797842e-07 -1.076326e-08   \n",
2772
       "2019-04-05  2.359754e-06  1.851080e-06  1.895205e-06  2.641687e-06   \n",
2773
       "...                  ...           ...           ...           ...   \n",
2774
       "2019-10-27 -5.999584e-07 -6.906911e-07 -6.094068e-07 -4.732139e-07   \n",
2775
       "2019-10-28  1.397000e-06  9.859024e-07  1.066181e-06  2.024451e-06   \n",
2776
       "2019-10-29 -6.309372e-07 -1.042560e-06 -1.056013e-06 -6.259414e-07   \n",
2777
       "2019-10-30  9.535004e-07  6.590445e-07  7.793678e-07  1.486794e-06   \n",
2778
       "2019-10-31  9.887800e-07  6.287566e-07  7.288098e-07  1.418339e-06   \n",
2779
       "\n",
2780
       "                strain_8   Surftemp         Rh    airtemp      avgRh  \\\n",
2781
       "timestamp                                                              \n",
2782
       "2019-04-01  2.746018e-06  11.802222  51.495514  11.349167  56.125002   \n",
2783
       "2019-04-02  4.467735e-06  11.776378  72.111068  10.497500  77.708336   \n",
2784
       "2019-04-03  3.083803e-06   8.487706  69.587566   8.279167  72.916666   \n",
2785
       "2019-04-04  1.905123e-06   7.694840  71.085618   7.617500  72.458332   \n",
2786
       "2019-04-05  5.894953e-06   9.097269  66.807711   9.810000  71.999998   \n",
2787
       "...                  ...        ...        ...        ...        ...   \n",
2788
       "2019-10-27  1.166937e-07  11.353086  74.968842   8.625833  86.211667   \n",
2789
       "2019-10-28  5.393001e-06   9.467404  80.369227   6.798333  90.648333   \n",
2790
       "2019-10-29  1.546657e-06   9.921486  76.104669   8.613333  74.891667   \n",
2791
       "2019-10-30  4.421555e-06   7.566899  77.632557   6.325000  78.035833   \n",
2792
       "2019-10-31  4.201527e-06   6.945136  76.931039   5.306667  81.060000   \n",
2793
       "\n",
2794
       "                avgVPr       avgGR       avgdR      avgdnr  totalrain  \\\n",
2795
       "timestamp                                                               \n",
2796
       "2019-04-01  708.982498  233.389167   87.455833  478.697500       0.00   \n",
2797
       "2019-04-02  985.274874   87.955000   83.221667    2.445000       0.05   \n",
2798
       "2019-04-03  790.862084  116.270833  107.811667   21.199167       0.00   \n",
2799
       "2019-04-04  738.126551  160.467500  128.485000  112.169167       0.00   \n",
2800
       "2019-04-05  846.904428  225.915833   94.376667  376.993333       0.00   \n",
2801
       "...                ...         ...         ...         ...        ...   \n",
2802
       "2019-10-27  963.436168   50.277500   45.353333    0.026667       0.00   \n",
2803
       "2019-10-28  895.893447   95.483333   30.701667  225.355000       0.00   \n",
2804
       "2019-10-29  833.864494   61.040000   42.480833   51.544167       0.00   \n",
2805
       "2019-10-30  745.242319   32.364167   29.780833    0.000000       0.00   \n",
2806
       "2019-10-31  723.901020   93.960000   49.780000  170.127500       0.00   \n",
2807
       "\n",
2808
       "             avgws10     avgwd10  retrofit  \n",
2809
       "timestamp                                   \n",
2810
       "2019-04-01  3.335575   37.478949         0  \n",
2811
       "2019-04-02  1.135126  209.014923         0  \n",
2812
       "2019-04-03  1.599006  141.619137         0  \n",
2813
       "2019-04-04  1.181543  178.318237         0  \n",
2814
       "2019-04-05  2.706478   30.143506         0  \n",
2815
       "...              ...         ...       ...  \n",
2816
       "2019-10-27  0.675000  212.700000         1  \n",
2817
       "2019-10-28  0.570000  185.550000         1  \n",
2818
       "2019-10-29  1.270000   36.745000         1  \n",
2819
       "2019-10-30  2.005000   44.650000         1  \n",
2820
       "2019-10-31  1.125000   53.745000         1  \n",
2821
       "\n",
2822
       "[61 rows x 17 columns]"
2823
      ]
2824
     },
2825
     "execution_count": 7,
2826
     "metadata": {},
2827
     "output_type": "execute_result"
2828
    }
2829
   ],
2830
   "source": [
2831
    "dfall"
2832
   ]
2833
  },
2834
  {
2835
   "cell_type": "code",
2836
   "execution_count": 8,
2837
   "id": "3f4497ea",
2838
   "metadata": {},
2839
   "outputs": [],
2840
   "source": [
2841
    "kept_gauges = ['strain_1', 'strain_2', 'strain_3', 'strain_5', 'strain_8']\n",
    "\n",
    "def single_gauge_frame(gauge):\n",
    "    # Copy of dfall without the other kept gauges, with this gauge's column renamed to the common name 'strain'.\n",
    "    other_gauges = [name for name in kept_gauges if name != gauge]\n",
    "    return dfall.drop(other_gauges, axis=1).rename(columns={gauge: 'strain'})\n",
    "\n",
    "# One frame per gauge, in the same order as kept_gauges.\n",
    "df_1, df_2, df_3, df_5, df_8 = map(single_gauge_frame, kept_gauges)"
2846
   ]
2847
  },
2848
  {
2849
   "cell_type": "code",
2850
   "execution_count": 9,
2851
   "id": "9e343c23",
2852
   "metadata": {},
2853
   "outputs": [],
2854
   "source": [
2855
    "# Attach a constant 'lx (m)' value to every row of each gauge frame\n",
    "# (presumably the gauge position along the structure in metres - TODO confirm).\n",
    "for gauge_frame, lx_value in ((df_1, 34.140625), (df_2, 48.515625), (df_3, 59.296875), (df_5, 80.859375), (df_8, 95.234375)):\n",
    "    gauge_frame[\"lx (m)\"] = lx_value"
2860
   ]
2861
  },
2862
  {
2863
   "cell_type": "code",
2864
   "execution_count": 10,
2865
   "id": "3a57124a",
2866
   "metadata": {},
2867
   "outputs": [],
2868
   "source": [
2869
    "# Stack the five per-gauge frames in order (rows of df_1 first, df_8 last), keeping each frame's index.\n",
    "# A single pd.concat replaces the chain of DataFrame.append calls, which pandas 2.0 removed.\n",
    "df_comp = pd.concat([df_1, df_2, df_3, df_5, df_8])"
2873
   ]
2874
  },
2875
  {
2876
   "cell_type": "code",
2877
   "execution_count": null,
2878
   "id": "03499b55",
2879
   "metadata": {},
2880
   "outputs": [],
2881
   "source": [
2882
    "plt.figure(figsize=(20,10))\n",
2883
    "plt.plot(df_1['timestamp'], df_1['strain'], marker='o', linestyle='--', color='r', label='Strain_1') \n",
2884
    "plt.plot(df_2['timestamp'], df_2['strain'], marker='o', linestyle='--', color='orange', label='Strain_2') \n",
2885
    "plt.plot(df_3['timestamp'], df_3['strain'], marker='o', linestyle='--', color='k', label='Strain_3') \n",
2886
    "plt.plot(df_5['timestamp'], df_5['strain'], marker='o', linestyle='--', color='y', label='Strain_5') \n",
2887
    "plt.plot(df_8['timestamp'], df_8['strain'], marker='o', linestyle='--', color='g', label='Strain_8') \n",
2888
    "plt.xticks(rotation=90)\n",
2889
    "plt.xlabel('Time Stamp')\n",
2890
    "plt.ylabel('Strain Value')\n",
2891
    "plt.legend()"
2892
   ]
2893
  },
2894
  {
2895
   "cell_type": "code",
2896
   "execution_count": 170,
2897
   "id": "97052d4e",
2898
   "metadata": {},
2899
   "outputs": [
2900
    {
2901
     "data": {
2902
      "text/html": [
2903
       "<div>\n",
2904
       "<style scoped>\n",
2905
       "    .dataframe tbody tr th:only-of-type {\n",
2906
       "        vertical-align: middle;\n",
2907
       "    }\n",
2908
       "\n",
2909
       "    .dataframe tbody tr th {\n",
2910
       "        vertical-align: top;\n",
2911
       "    }\n",
2912
       "\n",
2913
       "    .dataframe thead th {\n",
2914
       "        text-align: right;\n",
2915
       "    }\n",
2916
       "</style>\n",
2917
       "<table border=\"1\" class=\"dataframe\">\n",
2918
       "  <thead>\n",
2919
       "    <tr style=\"text-align: right;\">\n",
2920
       "      <th></th>\n",
2921
       "      <th>timestamp</th>\n",
2922
       "      <th>strain</th>\n",
2923
       "      <th>Surftemp</th>\n",
2924
       "      <th>Rh</th>\n",
2925
       "      <th>airtemp</th>\n",
2926
       "      <th>avgRh</th>\n",
2927
       "      <th>avgVPr</th>\n",
2928
       "      <th>avgGR</th>\n",
2929
       "      <th>avgdR</th>\n",
2930
       "      <th>avgdnr</th>\n",
2931
       "      <th>totalrain</th>\n",
2932
       "      <th>avgws10</th>\n",
2933
       "      <th>avgwd10</th>\n",
2934
       "      <th>retrofit</th>\n",
2935
       "      <th>lx (m)</th>\n",
2936
       "    </tr>\n",
2937
       "  </thead>\n",
2938
       "  <tbody>\n",
2939
       "    <tr>\n",
2940
       "      <th>0</th>\n",
2941
       "      <td>2019-04-01</td>\n",
2942
       "      <td>1.391124e-06</td>\n",
2943
       "      <td>11.802222</td>\n",
2944
       "      <td>51.495514</td>\n",
2945
       "      <td>11.349167</td>\n",
2946
       "      <td>56.125002</td>\n",
2947
       "      <td>708.982498</td>\n",
2948
       "      <td>233.389167</td>\n",
2949
       "      <td>87.455833</td>\n",
2950
       "      <td>478.697500</td>\n",
2951
       "      <td>0.00</td>\n",
2952
       "      <td>3.335575</td>\n",
2953
       "      <td>37.478949</td>\n",
2954
       "      <td>0</td>\n",
2955
       "      <td>34.140625</td>\n",
2956
       "    </tr>\n",
2957
       "    <tr>\n",
2958
       "      <th>1</th>\n",
2959
       "      <td>2019-04-02</td>\n",
2960
       "      <td>1.902302e-06</td>\n",
2961
       "      <td>11.776378</td>\n",
2962
       "      <td>72.111068</td>\n",
2963
       "      <td>10.497500</td>\n",
2964
       "      <td>77.708336</td>\n",
2965
       "      <td>985.274874</td>\n",
2966
       "      <td>87.955000</td>\n",
2967
       "      <td>83.221667</td>\n",
2968
       "      <td>2.445000</td>\n",
2969
       "      <td>0.05</td>\n",
2970
       "      <td>1.135126</td>\n",
2971
       "      <td>209.014923</td>\n",
2972
       "      <td>0</td>\n",
2973
       "      <td>34.140625</td>\n",
2974
       "    </tr>\n",
2975
       "    <tr>\n",
2976
       "      <th>2</th>\n",
2977
       "      <td>2019-04-03</td>\n",
2978
       "      <td>7.411497e-07</td>\n",
2979
       "      <td>8.487706</td>\n",
2980
       "      <td>69.587566</td>\n",
2981
       "      <td>8.279167</td>\n",
2982
       "      <td>72.916666</td>\n",
2983
       "      <td>790.862084</td>\n",
2984
       "      <td>116.270833</td>\n",
2985
       "      <td>107.811667</td>\n",
2986
       "      <td>21.199167</td>\n",
2987
       "      <td>0.00</td>\n",
2988
       "      <td>1.599006</td>\n",
2989
       "      <td>141.619137</td>\n",
2990
       "      <td>0</td>\n",
2991
       "      <td>34.140625</td>\n",
2992
       "    </tr>\n",
2993
       "    <tr>\n",
2994
       "      <th>3</th>\n",
2995
       "      <td>2019-04-04</td>\n",
2996
       "      <td>4.070716e-07</td>\n",
2997
       "      <td>7.694840</td>\n",
2998
       "      <td>71.085618</td>\n",
2999
       "      <td>7.617500</td>\n",
3000
       "      <td>72.458332</td>\n",
3001
       "      <td>738.126551</td>\n",
3002
       "      <td>160.467500</td>\n",
3003
       "      <td>128.485000</td>\n",
3004
       "      <td>112.169167</td>\n",
3005
       "      <td>0.00</td>\n",
3006
       "      <td>1.181543</td>\n",
3007
       "      <td>178.318237</td>\n",
3008
       "      <td>0</td>\n",
3009
       "      <td>34.140625</td>\n",
3010
       "    </tr>\n",
3011
       "    <tr>\n",
3012
       "      <th>4</th>\n",
3013
       "      <td>2019-04-05</td>\n",
3014
       "      <td>2.359754e-06</td>\n",
3015
       "      <td>9.097269</td>\n",
3016
       "      <td>66.807711</td>\n",
3017
       "      <td>9.810000</td>\n",
3018
       "      <td>71.999998</td>\n",
3019
       "      <td>846.904428</td>\n",
3020
       "      <td>225.915833</td>\n",
3021
       "      <td>94.376667</td>\n",
3022
       "      <td>376.993333</td>\n",
3023
       "      <td>0.00</td>\n",
3024
       "      <td>2.706478</td>\n",
3025
       "      <td>30.143506</td>\n",
3026
       "      <td>0</td>\n",
3027
       "      <td>34.140625</td>\n",
3028
       "    </tr>\n",
3029
       "    <tr>\n",
3030
       "      <th>...</th>\n",
3031
       "      <td>...</td>\n",
3032
       "      <td>...</td>\n",
3033
       "      <td>...</td>\n",
3034
       "      <td>...</td>\n",
3035
       "      <td>...</td>\n",
3036
       "      <td>...</td>\n",
3037
       "      <td>...</td>\n",
3038
       "      <td>...</td>\n",
3039
       "      <td>...</td>\n",
3040
       "      <td>...</td>\n",
3041
       "      <td>...</td>\n",
3042
       "      <td>...</td>\n",
3043
       "      <td>...</td>\n",
3044
       "      <td>...</td>\n",
3045
       "      <td>...</td>\n",
3046
       "    </tr>\n",
3047
       "    <tr>\n",
3048
       "      <th>56</th>\n",
3049
       "      <td>2019-10-27</td>\n",
3050
       "      <td>1.166937e-07</td>\n",
3051
       "      <td>11.353086</td>\n",
3052
       "      <td>74.968842</td>\n",
3053
       "      <td>8.625833</td>\n",
3054
       "      <td>86.211667</td>\n",
3055
       "      <td>963.436168</td>\n",
3056
       "      <td>50.277500</td>\n",
3057
       "      <td>45.353333</td>\n",
3058
       "      <td>0.026667</td>\n",
3059
       "      <td>0.00</td>\n",
3060
       "      <td>0.675000</td>\n",
3061
       "      <td>212.700000</td>\n",
3062
       "      <td>1</td>\n",
3063
       "      <td>95.234375</td>\n",
3064
       "    </tr>\n",
3065
       "    <tr>\n",
3066
       "      <th>57</th>\n",
3067
       "      <td>2019-10-28</td>\n",
3068
       "      <td>5.393001e-06</td>\n",
3069
       "      <td>9.467404</td>\n",
3070
       "      <td>80.369227</td>\n",
3071
       "      <td>6.798333</td>\n",
3072
       "      <td>90.648333</td>\n",
3073
       "      <td>895.893447</td>\n",
3074
       "      <td>95.483333</td>\n",
3075
       "      <td>30.701667</td>\n",
3076
       "      <td>225.355000</td>\n",
3077
       "      <td>0.00</td>\n",
3078
       "      <td>0.570000</td>\n",
3079
       "      <td>185.550000</td>\n",
3080
       "      <td>1</td>\n",
3081
       "      <td>95.234375</td>\n",
3082
       "    </tr>\n",
3083
       "    <tr>\n",
3084
       "      <th>58</th>\n",
3085
       "      <td>2019-10-29</td>\n",
3086
       "      <td>1.546657e-06</td>\n",
3087
       "      <td>9.921486</td>\n",
3088
       "      <td>76.104669</td>\n",
3089
       "      <td>8.613333</td>\n",
3090
       "      <td>74.891667</td>\n",
3091
       "      <td>833.864494</td>\n",
3092
       "      <td>61.040000</td>\n",
3093
       "      <td>42.480833</td>\n",
3094
       "      <td>51.544167</td>\n",
3095
       "      <td>0.00</td>\n",
3096
       "      <td>1.270000</td>\n",
3097
       "      <td>36.745000</td>\n",
3098
       "      <td>1</td>\n",
3099
       "      <td>95.234375</td>\n",
3100
       "    </tr>\n",
3101
       "    <tr>\n",
3102
       "      <th>59</th>\n",
3103
       "      <td>2019-10-30</td>\n",
3104
       "      <td>4.421555e-06</td>\n",
3105
       "      <td>7.566899</td>\n",
3106
       "      <td>77.632557</td>\n",
3107
       "      <td>6.325000</td>\n",
3108
       "      <td>78.035833</td>\n",
3109
       "      <td>745.242319</td>\n",
3110
       "      <td>32.364167</td>\n",
3111
       "      <td>29.780833</td>\n",
3112
       "      <td>0.000000</td>\n",
3113
       "      <td>0.00</td>\n",
3114
       "      <td>2.005000</td>\n",
3115
       "      <td>44.650000</td>\n",
3116
       "      <td>1</td>\n",
3117
       "      <td>95.234375</td>\n",
3118
       "    </tr>\n",
3119
       "    <tr>\n",
3120
       "      <th>60</th>\n",
3121
       "      <td>2019-10-31</td>\n",
3122
       "      <td>4.201527e-06</td>\n",
3123
       "      <td>6.945136</td>\n",
3124
       "      <td>76.931039</td>\n",
3125
       "      <td>5.306667</td>\n",
3126
       "      <td>81.060000</td>\n",
3127
       "      <td>723.901020</td>\n",
3128
       "      <td>93.960000</td>\n",
3129
       "      <td>49.780000</td>\n",
3130
       "      <td>170.127500</td>\n",
3131
       "      <td>0.00</td>\n",
3132
       "      <td>1.125000</td>\n",
3133
       "      <td>53.745000</td>\n",
3134
       "      <td>1</td>\n",
3135
       "      <td>95.234375</td>\n",
3136
       "    </tr>\n",
3137
       "  </tbody>\n",
3138
       "</table>\n",
3139
       "<p>305 rows × 15 columns</p>\n",
3140
       "</div>"
3141
      ],
3142
      "text/plain": [
3143
       "     timestamp        strain   Surftemp         Rh    airtemp      avgRh  \\\n",
3144
       "0   2019-04-01  1.391124e-06  11.802222  51.495514  11.349167  56.125002   \n",
3145
       "1   2019-04-02  1.902302e-06  11.776378  72.111068  10.497500  77.708336   \n",
3146
       "2   2019-04-03  7.411497e-07   8.487706  69.587566   8.279167  72.916666   \n",
3147
       "3   2019-04-04  4.070716e-07   7.694840  71.085618   7.617500  72.458332   \n",
3148
       "4   2019-04-05  2.359754e-06   9.097269  66.807711   9.810000  71.999998   \n",
3149
       "..         ...           ...        ...        ...        ...        ...   \n",
3150
       "56  2019-10-27  1.166937e-07  11.353086  74.968842   8.625833  86.211667   \n",
3151
       "57  2019-10-28  5.393001e-06   9.467404  80.369227   6.798333  90.648333   \n",
3152
       "58  2019-10-29  1.546657e-06   9.921486  76.104669   8.613333  74.891667   \n",
3153
       "59  2019-10-30  4.421555e-06   7.566899  77.632557   6.325000  78.035833   \n",
3154
       "60  2019-10-31  4.201527e-06   6.945136  76.931039   5.306667  81.060000   \n",
3155
       "\n",
3156
       "        avgVPr       avgGR       avgdR      avgdnr  totalrain   avgws10  \\\n",
3157
       "0   708.982498  233.389167   87.455833  478.697500       0.00  3.335575   \n",
3158
       "1   985.274874   87.955000   83.221667    2.445000       0.05  1.135126   \n",
3159
       "2   790.862084  116.270833  107.811667   21.199167       0.00  1.599006   \n",
3160
       "3   738.126551  160.467500  128.485000  112.169167       0.00  1.181543   \n",
3161
       "4   846.904428  225.915833   94.376667  376.993333       0.00  2.706478   \n",
3162
       "..         ...         ...         ...         ...        ...       ...   \n",
3163
       "56  963.436168   50.277500   45.353333    0.026667       0.00  0.675000   \n",
3164
       "57  895.893447   95.483333   30.701667  225.355000       0.00  0.570000   \n",
3165
       "58  833.864494   61.040000   42.480833   51.544167       0.00  1.270000   \n",
3166
       "59  745.242319   32.364167   29.780833    0.000000       0.00  2.005000   \n",
3167
       "60  723.901020   93.960000   49.780000  170.127500       0.00  1.125000   \n",
3168
       "\n",
3169
       "       avgwd10  retrofit     lx (m)  \n",
3170
       "0    37.478949         0  34.140625  \n",
3171
       "1   209.014923         0  34.140625  \n",
3172
       "2   141.619137         0  34.140625  \n",
3173
       "3   178.318237         0  34.140625  \n",
3174
       "4    30.143506         0  34.140625  \n",
3175
       "..         ...       ...        ...  \n",
3176
       "56  212.700000         1  95.234375  \n",
3177
       "57  185.550000         1  95.234375  \n",
3178
       "58   36.745000         1  95.234375  \n",
3179
       "59   44.650000         1  95.234375  \n",
3180
       "60   53.745000         1  95.234375  \n",
3181
       "\n",
3182
       "[305 rows x 15 columns]"
3183
      ]
3184
     },
3185
     "execution_count": 170,
3186
     "metadata": {},
3187
     "output_type": "execute_result"
3188
    }
3189
   ],
3190
   "source": [
3191
    "df_comp"
3192
   ]
3193
  },
3194
  {
3195
   "cell_type": "code",
3196
   "execution_count": 13,
3197
   "id": "b73b8554",
3198
   "metadata": {},
3199
   "outputs": [
3200
    {
3201
     "data": {
3202
      "text/plain": [
3203
       "LinearRegression()"
3204
      ]
3205
     },
3206
     "execution_count": 13,
3207
     "metadata": {},
3208
     "output_type": "execute_result"
3209
    }
3210
   ],
3211
   "source": [
3212
    "#run linear regression\n",
3213
    "\n",
3214
    "import numpy as np\n",
3215
    "import pandas as pd\n",
3216
    "from sklearn.linear_model import LinearRegression\n",
3217
    "import matplotlib.pyplot as plt\n",
3218
    "%matplotlib inline\n",
3219
    "from sklearn.model_selection import train_test_split\n",
3220
    "\n",
3221
    "#dealing with missing values\n",
3222
    "X = df_comp.drop('strain', axis=1)\n",
3223
    "y = df_comp['strain']\n",
3224
    "\n",
3225
    "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)\n",
3226
    "\n",
3227
    "lr = LinearRegression()\n",
3228
    "lr.fit(X_train, y_train)\n"
3229
   ]
3230
  },
3231
  {
3232
   "cell_type": "code",
3233
   "execution_count": 182,
3234
   "id": "6f545ec4",
3235
   "metadata": {},
3236
   "outputs": [
3237
    {
3238
     "data": {
3239
      "text/plain": [
3240
       "array([-7.32918585e-07, -2.31772820e-07,  1.07521188e-06,  2.83471035e-07,\n",
3241
       "       -4.83768362e-09,  1.14031235e-08, -2.04704203e-08, -6.49621047e-09,\n",
3242
       "       -1.70444583e-06,  8.94803691e-08, -3.00796022e-09, -5.62001361e-07,\n",
3243
       "        3.14184517e-08])"
3244
      ]
3245
     },
3246
     "execution_count": 182,
3247
     "metadata": {},
3248
     "output_type": "execute_result"
3249
    }
3250
   ],
3251
   "source": [
3252
    "lr.coef_"
3253
   ]
3254
  },
3255
  {
3256
   "cell_type": "code",
3257
   "execution_count": 183,
3258
   "id": "252c0de5",
3259
   "metadata": {},
3260
   "outputs": [
3261
    {
3262
     "data": {
3263
      "text/plain": [
3264
       "-2.3164128924815833e-06"
3265
      ]
3266
     },
3267
     "execution_count": 183,
3268
     "metadata": {},
3269
     "output_type": "execute_result"
3270
    }
3271
   ],
3272
   "source": [
3273
    "lr.intercept_"
3274
   ]
3275
  },
3276
  {
3277
   "cell_type": "code",
3278
   "execution_count": 184,
3279
   "id": "2a6a1bd9",
3280
   "metadata": {},
3281
   "outputs": [
3282
    {
3283
     "data": {
3284
      "text/plain": [
3285
       "0.3924089764234414"
3286
      ]
3287
     },
3288
     "execution_count": 184,
3289
     "metadata": {},
3290
     "output_type": "execute_result"
3291
    }
3292
   ],
3293
   "source": [
3294
    "lr.score(X_test, y_test)"
3295
   ]
3296
  },
3297
  {
3298
   "cell_type": "code",
3299
   "execution_count": 185,
3300
   "id": "a55527fa",
3301
   "metadata": {},
3302
   "outputs": [
3303
    {
3304
     "data": {
3305
      "text/html": [
3306
       "<div>\n",
3307
       "<style scoped>\n",
3308
       "    .dataframe tbody tr th:only-of-type {\n",
3309
       "        vertical-align: middle;\n",
3310
       "    }\n",
3311
       "\n",
3312
       "    .dataframe tbody tr th {\n",
3313
       "        vertical-align: top;\n",
3314
       "    }\n",
3315
       "\n",
3316
       "    .dataframe thead th {\n",
3317
       "        text-align: right;\n",
3318
       "    }\n",
3319
       "</style>\n",
3320
       "<table border=\"1\" class=\"dataframe\">\n",
3321
       "  <thead>\n",
3322
       "    <tr style=\"text-align: right;\">\n",
3323
       "      <th></th>\n",
3324
       "      <th>Surftemp</th>\n",
3325
       "      <th>Rh</th>\n",
3326
       "      <th>airtemp</th>\n",
3327
       "      <th>avgRh</th>\n",
3328
       "      <th>avgVPr</th>\n",
3329
       "      <th>avgGR</th>\n",
3330
       "      <th>avgdR</th>\n",
3331
       "      <th>avgdnr</th>\n",
3332
       "      <th>totalrain</th>\n",
3333
       "      <th>avgws10</th>\n",
3334
       "      <th>avgwd10</th>\n",
3335
       "      <th>retrofit</th>\n",
3336
       "      <th>lx (m)</th>\n",
3337
       "    </tr>\n",
3338
       "  </thead>\n",
3339
       "  <tbody>\n",
3340
       "    <tr>\n",
3341
       "      <th>Surftemp</th>\n",
3342
       "      <td>1.000000e+00</td>\n",
3343
       "      <td>-2.152850e-01</td>\n",
3344
       "      <td>9.747528e-01</td>\n",
3345
       "      <td>-2.983697e-01</td>\n",
3346
       "      <td>5.684068e-01</td>\n",
3347
       "      <td>9.519627e-02</td>\n",
3348
       "      <td>-8.447963e-02</td>\n",
3349
       "      <td>1.256301e-01</td>\n",
3350
       "      <td>4.533550e-02</td>\n",
3351
       "      <td>1.839667e-01</td>\n",
3352
       "      <td>-4.586977e-02</td>\n",
3353
       "      <td>7.498677e-02</td>\n",
3354
       "      <td>1.677069e-16</td>\n",
3355
       "    </tr>\n",
3356
       "    <tr>\n",
3357
       "      <th>Rh</th>\n",
3358
       "      <td>-2.152850e-01</td>\n",
3359
       "      <td>1.000000e+00</td>\n",
3360
       "      <td>-2.480698e-01</td>\n",
3361
       "      <td>9.723831e-01</td>\n",
3362
       "      <td>6.446555e-01</td>\n",
3363
       "      <td>-8.661916e-01</td>\n",
3364
       "      <td>-5.956108e-01</td>\n",
3365
       "      <td>-8.056235e-01</td>\n",
3366
       "      <td>2.042600e-01</td>\n",
3367
       "      <td>-5.197775e-01</td>\n",
3368
       "      <td>4.503028e-01</td>\n",
3369
       "      <td>7.288194e-01</td>\n",
3370
       "      <td>7.335662e-16</td>\n",
3371
       "    </tr>\n",
3372
       "    <tr>\n",
3373
       "      <th>airtemp</th>\n",
3374
       "      <td>9.747528e-01</td>\n",
3375
       "      <td>-2.480698e-01</td>\n",
3376
       "      <td>1.000000e+00</td>\n",
3377
       "      <td>-3.616480e-01</td>\n",
3378
       "      <td>5.406419e-01</td>\n",
3379
       "      <td>1.694691e-01</td>\n",
3380
       "      <td>-3.510775e-02</td>\n",
3381
       "      <td>1.952337e-01</td>\n",
3382
       "      <td>4.971249e-03</td>\n",
3383
       "      <td>2.731617e-01</td>\n",
3384
       "      <td>-6.243032e-02</td>\n",
3385
       "      <td>2.017131e-03</td>\n",
3386
       "      <td>-6.014388e-16</td>\n",
3387
       "    </tr>\n",
3388
       "    <tr>\n",
3389
       "      <th>avgRh</th>\n",
3390
       "      <td>-2.983697e-01</td>\n",
3391
       "      <td>9.723831e-01</td>\n",
3392
       "      <td>-3.616480e-01</td>\n",
3393
       "      <td>1.000000e+00</td>\n",
3394
       "      <td>5.608952e-01</td>\n",
3395
       "      <td>-8.401467e-01</td>\n",
3396
       "      <td>-5.541348e-01</td>\n",
3397
       "      <td>-7.924454e-01</td>\n",
3398
       "      <td>2.558436e-01</td>\n",
3399
       "      <td>-5.950151e-01</td>\n",
3400
       "      <td>4.794773e-01</td>\n",
3401
       "      <td>6.712207e-01</td>\n",
3402
       "      <td>6.911524e-16</td>\n",
3403
       "    </tr>\n",
3404
       "    <tr>\n",
3405
       "      <th>avgVPr</th>\n",
3406
       "      <td>5.684068e-01</td>\n",
3407
       "      <td>6.446555e-01</td>\n",
3408
       "      <td>5.406419e-01</td>\n",
3409
       "      <td>5.608952e-01</td>\n",
3410
       "      <td>1.000000e+00</td>\n",
3411
       "      <td>-6.132273e-01</td>\n",
3412
       "      <td>-5.177388e-01</td>\n",
3413
       "      <td>-5.510338e-01</td>\n",
3414
       "      <td>2.094811e-01</td>\n",
3415
       "      <td>-2.036595e-01</td>\n",
3416
       "      <td>3.509903e-01</td>\n",
3417
       "      <td>6.112809e-01</td>\n",
3418
       "      <td>-2.054537e-16</td>\n",
3419
       "    </tr>\n",
3420
       "    <tr>\n",
3421
       "      <th>avgGR</th>\n",
3422
       "      <td>9.519627e-02</td>\n",
3423
       "      <td>-8.661916e-01</td>\n",
3424
       "      <td>1.694691e-01</td>\n",
3425
       "      <td>-8.401467e-01</td>\n",
3426
       "      <td>-6.132273e-01</td>\n",
3427
       "      <td>1.000000e+00</td>\n",
3428
       "      <td>7.293697e-01</td>\n",
3429
       "      <td>9.061787e-01</td>\n",
3430
       "      <td>-1.775341e-01</td>\n",
3431
       "      <td>4.630690e-01</td>\n",
3432
       "      <td>-2.412233e-01</td>\n",
3433
       "      <td>-7.829176e-01</td>\n",
3434
       "      <td>4.095492e-16</td>\n",
3435
       "    </tr>\n",
3436
       "    <tr>\n",
3437
       "      <th>avgdR</th>\n",
3438
       "      <td>-8.447963e-02</td>\n",
3439
       "      <td>-5.956108e-01</td>\n",
3440
       "      <td>-3.510775e-02</td>\n",
3441
       "      <td>-5.541348e-01</td>\n",
3442
       "      <td>-5.177388e-01</td>\n",
3443
       "      <td>7.293697e-01</td>\n",
3444
       "      <td>1.000000e+00</td>\n",
3445
       "      <td>3.899672e-01</td>\n",
3446
       "      <td>-1.374128e-01</td>\n",
3447
       "      <td>2.765396e-01</td>\n",
3448
       "      <td>-2.703759e-02</td>\n",
3449
       "      <td>-7.715444e-01</td>\n",
3450
       "      <td>-7.025112e-16</td>\n",
3451
       "    </tr>\n",
3452
       "    <tr>\n",
3453
       "      <th>avgdnr</th>\n",
3454
       "      <td>1.256301e-01</td>\n",
3455
       "      <td>-8.056235e-01</td>\n",
3456
       "      <td>1.952337e-01</td>\n",
3457
       "      <td>-7.924454e-01</td>\n",
3458
       "      <td>-5.510338e-01</td>\n",
3459
       "      <td>9.061787e-01</td>\n",
3460
       "      <td>3.899672e-01</td>\n",
3461
       "      <td>1.000000e+00</td>\n",
3462
       "      <td>-1.841247e-01</td>\n",
3463
       "      <td>4.780176e-01</td>\n",
3464
       "      <td>-3.274065e-01</td>\n",
3465
       "      <td>-5.869362e-01</td>\n",
3466
       "      <td>4.600683e-17</td>\n",
3467
       "    </tr>\n",
3468
       "    <tr>\n",
3469
       "      <th>totalrain</th>\n",
3470
       "      <td>4.533550e-02</td>\n",
3471
       "      <td>2.042600e-01</td>\n",
3472
       "      <td>4.971249e-03</td>\n",
3473
       "      <td>2.558436e-01</td>\n",
3474
       "      <td>2.094811e-01</td>\n",
3475
       "      <td>-1.775341e-01</td>\n",
3476
       "      <td>-1.374128e-01</td>\n",
3477
       "      <td>-1.841247e-01</td>\n",
3478
       "      <td>1.000000e+00</td>\n",
3479
       "      <td>-1.593518e-01</td>\n",
3480
       "      <td>1.882248e-01</td>\n",
3481
       "      <td>-5.927637e-02</td>\n",
3482
       "      <td>9.468082e-17</td>\n",
3483
       "    </tr>\n",
3484
       "    <tr>\n",
3485
       "      <th>avgws10</th>\n",
3486
       "      <td>1.839667e-01</td>\n",
3487
       "      <td>-5.197775e-01</td>\n",
3488
       "      <td>2.731617e-01</td>\n",
3489
       "      <td>-5.950151e-01</td>\n",
3490
       "      <td>-2.036595e-01</td>\n",
3491
       "      <td>4.630690e-01</td>\n",
3492
       "      <td>2.765396e-01</td>\n",
3493
       "      <td>4.780176e-01</td>\n",
3494
       "      <td>-1.593518e-01</td>\n",
3495
       "      <td>1.000000e+00</td>\n",
3496
       "      <td>-2.644061e-01</td>\n",
3497
       "      <td>-2.872552e-01</td>\n",
3498
       "      <td>-1.120402e-15</td>\n",
3499
       "    </tr>\n",
3500
       "    <tr>\n",
3501
       "      <th>avgwd10</th>\n",
3502
       "      <td>-4.586977e-02</td>\n",
3503
       "      <td>4.503028e-01</td>\n",
3504
       "      <td>-6.243032e-02</td>\n",
3505
       "      <td>4.794773e-01</td>\n",
3506
       "      <td>3.509903e-01</td>\n",
3507
       "      <td>-2.412233e-01</td>\n",
3508
       "      <td>-2.703759e-02</td>\n",
3509
       "      <td>-3.274065e-01</td>\n",
3510
       "      <td>1.882248e-01</td>\n",
3511
       "      <td>-2.644061e-01</td>\n",
3512
       "      <td>1.000000e+00</td>\n",
3513
       "      <td>1.689668e-01</td>\n",
3514
       "      <td>2.738244e-16</td>\n",
3515
       "    </tr>\n",
3516
       "    <tr>\n",
3517
       "      <th>retrofit</th>\n",
3518
       "      <td>7.498677e-02</td>\n",
3519
       "      <td>7.288194e-01</td>\n",
3520
       "      <td>2.017131e-03</td>\n",
3521
       "      <td>6.712207e-01</td>\n",
3522
       "      <td>6.112809e-01</td>\n",
3523
       "      <td>-7.829176e-01</td>\n",
3524
       "      <td>-7.715444e-01</td>\n",
3525
       "      <td>-5.869362e-01</td>\n",
3526
       "      <td>-5.927637e-02</td>\n",
3527
       "      <td>-2.872552e-01</td>\n",
3528
       "      <td>1.689668e-01</td>\n",
3529
       "      <td>1.000000e+00</td>\n",
3530
       "      <td>2.020656e-16</td>\n",
3531
       "    </tr>\n",
3532
       "    <tr>\n",
3533
       "      <th>lx (m)</th>\n",
3534
       "      <td>1.677069e-16</td>\n",
3535
       "      <td>7.335662e-16</td>\n",
3536
       "      <td>-6.014388e-16</td>\n",
3537
       "      <td>6.911524e-16</td>\n",
3538
       "      <td>-2.054537e-16</td>\n",
3539
       "      <td>4.095492e-16</td>\n",
3540
       "      <td>-7.025112e-16</td>\n",
3541
       "      <td>4.600683e-17</td>\n",
3542
       "      <td>9.468082e-17</td>\n",
3543
       "      <td>-1.120402e-15</td>\n",
3544
       "      <td>2.738244e-16</td>\n",
3545
       "      <td>2.020656e-16</td>\n",
3546
       "      <td>1.000000e+00</td>\n",
3547
       "    </tr>\n",
3548
       "  </tbody>\n",
3549
       "</table>\n",
3550
       "</div>"
3551
      ],
3552
      "text/plain": [
3553
       "               Surftemp            Rh       airtemp         avgRh  \\\n",
3554
       "Surftemp   1.000000e+00 -2.152850e-01  9.747528e-01 -2.983697e-01   \n",
3555
       "Rh        -2.152850e-01  1.000000e+00 -2.480698e-01  9.723831e-01   \n",
3556
       "airtemp    9.747528e-01 -2.480698e-01  1.000000e+00 -3.616480e-01   \n",
3557
       "avgRh     -2.983697e-01  9.723831e-01 -3.616480e-01  1.000000e+00   \n",
3558
       "avgVPr     5.684068e-01  6.446555e-01  5.406419e-01  5.608952e-01   \n",
3559
       "avgGR      9.519627e-02 -8.661916e-01  1.694691e-01 -8.401467e-01   \n",
3560
       "avgdR     -8.447963e-02 -5.956108e-01 -3.510775e-02 -5.541348e-01   \n",
3561
       "avgdnr     1.256301e-01 -8.056235e-01  1.952337e-01 -7.924454e-01   \n",
3562
       "totalrain  4.533550e-02  2.042600e-01  4.971249e-03  2.558436e-01   \n",
3563
       "avgws10    1.839667e-01 -5.197775e-01  2.731617e-01 -5.950151e-01   \n",
3564
       "avgwd10   -4.586977e-02  4.503028e-01 -6.243032e-02  4.794773e-01   \n",
3565
       "retrofit   7.498677e-02  7.288194e-01  2.017131e-03  6.712207e-01   \n",
3566
       "lx (m)     1.677069e-16  7.335662e-16 -6.014388e-16  6.911524e-16   \n",
3567
       "\n",
3568
       "                 avgVPr         avgGR         avgdR        avgdnr  \\\n",
3569
       "Surftemp   5.684068e-01  9.519627e-02 -8.447963e-02  1.256301e-01   \n",
3570
       "Rh         6.446555e-01 -8.661916e-01 -5.956108e-01 -8.056235e-01   \n",
3571
       "airtemp    5.406419e-01  1.694691e-01 -3.510775e-02  1.952337e-01   \n",
3572
       "avgRh      5.608952e-01 -8.401467e-01 -5.541348e-01 -7.924454e-01   \n",
3573
       "avgVPr     1.000000e+00 -6.132273e-01 -5.177388e-01 -5.510338e-01   \n",
3574
       "avgGR     -6.132273e-01  1.000000e+00  7.293697e-01  9.061787e-01   \n",
3575
       "avgdR     -5.177388e-01  7.293697e-01  1.000000e+00  3.899672e-01   \n",
3576
       "avgdnr    -5.510338e-01  9.061787e-01  3.899672e-01  1.000000e+00   \n",
3577
       "totalrain  2.094811e-01 -1.775341e-01 -1.374128e-01 -1.841247e-01   \n",
3578
       "avgws10   -2.036595e-01  4.630690e-01  2.765396e-01  4.780176e-01   \n",
3579
       "avgwd10    3.509903e-01 -2.412233e-01 -2.703759e-02 -3.274065e-01   \n",
3580
       "retrofit   6.112809e-01 -7.829176e-01 -7.715444e-01 -5.869362e-01   \n",
3581
       "lx (m)    -2.054537e-16  4.095492e-16 -7.025112e-16  4.600683e-17   \n",
3582
       "\n",
3583
       "              totalrain       avgws10       avgwd10      retrofit  \\\n",
3584
       "Surftemp   4.533550e-02  1.839667e-01 -4.586977e-02  7.498677e-02   \n",
3585
       "Rh         2.042600e-01 -5.197775e-01  4.503028e-01  7.288194e-01   \n",
3586
       "airtemp    4.971249e-03  2.731617e-01 -6.243032e-02  2.017131e-03   \n",
3587
       "avgRh      2.558436e-01 -5.950151e-01  4.794773e-01  6.712207e-01   \n",
3588
       "avgVPr     2.094811e-01 -2.036595e-01  3.509903e-01  6.112809e-01   \n",
3589
       "avgGR     -1.775341e-01  4.630690e-01 -2.412233e-01 -7.829176e-01   \n",
3590
       "avgdR     -1.374128e-01  2.765396e-01 -2.703759e-02 -7.715444e-01   \n",
3591
       "avgdnr    -1.841247e-01  4.780176e-01 -3.274065e-01 -5.869362e-01   \n",
3592
       "totalrain  1.000000e+00 -1.593518e-01  1.882248e-01 -5.927637e-02   \n",
3593
       "avgws10   -1.593518e-01  1.000000e+00 -2.644061e-01 -2.872552e-01   \n",
3594
       "avgwd10    1.882248e-01 -2.644061e-01  1.000000e+00  1.689668e-01   \n",
3595
       "retrofit  -5.927637e-02 -2.872552e-01  1.689668e-01  1.000000e+00   \n",
3596
       "lx (m)     9.468082e-17 -1.120402e-15  2.738244e-16  2.020656e-16   \n",
3597
       "\n",
3598
       "                 lx (m)  \n",
3599
       "Surftemp   1.677069e-16  \n",
3600
       "Rh         7.335662e-16  \n",
3601
       "airtemp   -6.014388e-16  \n",
3602
       "avgRh      6.911524e-16  \n",
3603
       "avgVPr    -2.054537e-16  \n",
3604
       "avgGR      4.095492e-16  \n",
3605
       "avgdR     -7.025112e-16  \n",
3606
       "avgdnr     4.600683e-17  \n",
3607
       "totalrain  9.468082e-17  \n",
3608
       "avgws10   -1.120402e-15  \n",
3609
       "avgwd10    2.738244e-16  \n",
3610
       "retrofit   2.020656e-16  \n",
3611
       "lx (m)     1.000000e+00  "
3612
      ]
3613
     },
3614
     "execution_count": 185,
3615
     "metadata": {},
3616
     "output_type": "execute_result"
3617
    }
3618
   ],
3619
   "source": [
3620
    "X.corr()"
3621
   ]
3622
  },
3623
  {
3624
   "cell_type": "code",
3625
   "execution_count": 138,
3626
   "id": "bc340140",
3627
   "metadata": {},
3628
   "outputs": [
3629
    {
3630
     "data": {
3631
      "text/plain": [
3632
       "<AxesSubplot:>"
3633
      ]
3634
     },
3635
     "execution_count": 138,
3636
     "metadata": {},
3637
     "output_type": "execute_result"
3638
    },
3639
    {
3640
     "data": {
3641
      "image/png": "\n",
3642
      "text/plain": [
3643
       "<Figure size 1080x576 with 2 Axes>"
3644
      ]
3645
     },
3646
     "metadata": {},
3647
     "output_type": "display_data"
3648
    }
3649
   ],
3650
   "source": [
3651
    "import seaborn as sns\n",
3652
    "sns.set(rc = {'figure.figsize':(15,8)})\n",
3653
    "sns.heatmap(X.corr())\n"
3654
   ]
3655
  },
3656
  {
3657
   "cell_type": "code",
3658
   "execution_count": 14,
3659
   "id": "5edc2102",
3660
   "metadata": {},
3661
   "outputs": [
3662
    {
3663
     "data": {
3664
      "text/plain": [
3665
       "array([-1.00330316e-06, -2.34493720e-07,  7.09387255e-07,  2.98206738e-07,\n",
3666
       "       -5.44373350e-09,  9.78316711e-09, -1.85111235e-08, -6.81229930e-09,\n",
3667
       "       -2.07917277e-06,  2.79915760e-07, -2.56745536e-09, -9.96398106e-07,\n",
3668
       "        3.11206047e-08,  2.65314746e-08,  2.52690794e-10,  2.48370481e-12])"
3669
      ]
3670
     },
3671
     "execution_count": 14,
3672
     "metadata": {},
3673
     "output_type": "execute_result"
3674
    }
3675
   ],
3676
   "source": [
3677
    "#Linear Regression with correlated variables\n",
3678
    "\n",
3679
    "# Air_temp and Surf_temp\n",
3680
    "# AvgRh and Rh\n",
3681
    "# Avgdnr and avgGR\n",
3682
    "\n",
3683
    "df_new = df_comp.copy()\n",
3684
    "df_new['airtemp*Surftemp'] = df_new['airtemp']*df_new['Surftemp']\n",
3685
    "df_new['avgRh*Rh'] = df_new['avgRh']*df_new['Rh']\n",
3686
    "df_new['avgdnr*avgGR'] = df_new['avgdnr']*df_new['avgGR']\n",
3687
    "X1 = df_new.drop('strain', axis=1)\n",
3688
    "y1 = df_new['strain']\n",
3689
    "X1_train, X1_test, y1_train, y1_test = train_test_split(X1, y1, test_size=0.3, random_state=42)\n",
3690
    "lr1 = LinearRegression()\n",
3691
    "lr1.fit(X1_train, y1_train)\n",
3692
    "lr1.coef_"
3693
   ]
3694
  },
3695
  {
3696
   "cell_type": "code",
3697
   "execution_count": 15,
3698
   "id": "9df6682b",
3699
   "metadata": {},
3700
   "outputs": [
3701
    {
3702
     "data": {
3703
      "text/plain": [
3704
       "-6.767178628037426e-07"
3705
      ]
3706
     },
3707
     "execution_count": 15,
3708
     "metadata": {},
3709
     "output_type": "execute_result"
3710
    }
3711
   ],
3712
   "source": [
3713
    "lr1.intercept_"
3714
   ]
3715
  },
3716
  {
3717
   "cell_type": "code",
3718
   "execution_count": 17,
3719
   "id": "ff1a4e98",
3720
   "metadata": {},
3721
   "outputs": [
3722
    {
3723
     "data": {
3724
      "text/plain": [
3725
       "0.4217589069954959"
3726
      ]
3727
     },
3728
     "execution_count": 17,
3729
     "metadata": {},
3730
     "output_type": "execute_result"
3731
    }
3732
   ],
3733
   "source": [
3734
    "lr1.score(X1_test,y1_test)"
3735
   ]
3736
  },
3737
  {
3738
   "cell_type": "code",
3739
   "execution_count": 18,
3740
   "id": "1f812841",
3741
   "metadata": {},
3742
   "outputs": [
3743
    {
3744
     "data": {
3745
      "text/plain": [
3746
       "array([-1.02847347e-06, -2.16258266e-07,  7.39409173e-07,  3.24857545e-07,\n",
3747
       "       -6.07804384e-09,  1.19045085e-08, -2.12715103e-08, -6.86964903e-09,\n",
3748
       "       -2.07847876e-06,  2.89672063e-07, -2.49922913e-09, -1.01819999e-06,\n",
3749
       "        3.09133416e-08,  2.80110267e-08])"
3750
      ]
3751
     },
3752
     "execution_count": 18,
3753
     "metadata": {},
3754
     "output_type": "execute_result"
3755
    }
3756
   ],
3757
   "source": [
3758
    "#final Linear Regression\n",
3759
    "\n",
3760
    "df_final = df_comp.copy()\n",
3761
    "df_final['airtemp*Surftemp'] = df_final['airtemp']*df_final['Surftemp'] \n",
3762
    "X2 = df_final.drop('strain', axis=1)\n",
3763
    "y2 = df_final['strain']\n",
3764
    "lr2 = LinearRegression()\n",
3765
    "X2_train, X2_test, y2_train, y2_test = train_test_split(X2, y2, test_size=0.3, random_state=42)\n",
3766
    "lr2.fit(X2_train,y2_train)\n",
3767
    "lr2.coef_"
3768
   ]
3769
  },
3770
  {
3771
   "cell_type": "code",
3772
   "execution_count": 19,
3773
   "id": "a579f226",
3774
   "metadata": {},
3775
   "outputs": [
3776
    {
3777
     "data": {
3778
      "text/plain": [
3779
       "-2.1807076893661185e-06"
3780
      ]
3781
     },
3782
     "execution_count": 19,
3783
     "metadata": {},
3784
     "output_type": "execute_result"
3785
    }
3786
   ],
3787
   "source": [
3788
    "lr2.intercept_"
3789
   ]
3790
  },
3791
  {
3792
   "cell_type": "code",
3793
   "execution_count": 20,
3794
   "id": "aaa8b9ef",
3795
   "metadata": {},
3796
   "outputs": [
3797
    {
3798
     "data": {
3799
      "text/plain": [
3800
       "0.42059142260398696"
3801
      ]
3802
     },
3803
     "execution_count": 20,
3804
     "metadata": {},
3805
     "output_type": "execute_result"
3806
    }
3807
   ],
3808
   "source": [
3809
    "lr2.score(X2_test, y2_test)"
3810
   ]
3811
  },
3812
  {
3813
   "cell_type": "code",
3814
   "execution_count": null,
3815
   "id": "d022ddd3",
3816
   "metadata": {},
3817
   "outputs": [],
3818
   "source": []
3819
  }
3820
 ],
3821
 "metadata": {
3822
  "kernelspec": {
3823
   "display_name": "Python 3",
3824
   "language": "python",
3825
   "name": "python3"
3826
  },
3827
  "language_info": {
3828
   "codemirror_mode": {
3829
    "name": "ipython",
3830
    "version": 3
3831
   },
3832
   "file_extension": ".py",
3833
   "mimetype": "text/x-python",
3834
   "name": "python",
3835
   "nbconvert_exporter": "python",
3836
   "pygments_lexer": "ipython3",
3837
   "version": "3.9.5"
3838
  }
3839
 },
3840
 "nbformat": 4,
3841
 "nbformat_minor": 5
3842
}