COVID-19_Multi-Omics / Git / [bd22c4] /src/dash/apps/linear

Models:
AlyssaS/
COVID-19_Multi-Omics
Downloads: 1
[bd22c4]: / src / dash / apps / linear_regression.py
History
Download this file
208 lines (166 with data), 7.6 kB

import dash
import dash_table
import dash_bootstrap_components as dbc
import dash_core_components as dcc
import dash_html_components as html
from dash.dependencies import Input, Output
import datetime
import pandas as pd

from data import get_omics_data, get_biomolecule_names, get_combined_data, get_p_values, get_volcano_data
from plot import correlation_scatter
from nav import navbar

# importing app through index page
from app import app
from apps import differential_expression

print()
print(datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
print("Loading data for linear_regression...")
print()

# load metabolomics data matrix
print("Loading metabolomics data...")
from app import metabolomics_df, metabolomics_quant_range
print("Metabolomics data shape: {}".format(metabolomics_df.shape))
print("Loading lipidomics data...")
from app import lipidomics_df, lipidomics_quant_range
print("Lipidomics data shape: {}".format(lipidomics_df.shape))
print("Loading proteomics data...")
from app import proteomics_df, proteomics_quant_range
print("Proteomics data shape: {}".format(proteomics_df.shape))
print("Loading transcriptomics data...")
from app import transcriptomics_df, transcriptomics_quant_range
print("Transcriptomics data shape: {}".format(transcriptomics_df.shape))

available_datasets = ['Proteins', 'Lipids', 'Metabolites', 'Combined Biomolecules', 'Transcripts']

# define dataset dictionaries
from app import dataset_dict, df_dict, quant_value_range_dict, global_names_dict
from app import metabolomics_biomolecule_names_dict
from app import lipidomics_biomolecule_names_dict
from app import proteomics_biomolecule_names_dict
from app import transcriptomics_biomolecule_names_dict

global_names_dict = {
    "proteomics":proteomics_biomolecule_names_dict,
    "lipidomics":lipidomics_biomolecule_names_dict,
    "metabolomics":metabolomics_biomolecule_names_dict,
    "combined":{**proteomics_biomolecule_names_dict,
                **lipidomics_biomolecule_names_dict,
                **metabolomics_biomolecule_names_dict,
                **transcriptomics_biomolecule_names_dict}
}

# get combined omics df and quant value range
print("Creating combined omics df...")
# get combined data with transcriptomics
df_dict, quant_value_range_dict = get_combined_data(df_dict,
    quant_value_range_dict, with_transcripts=True)

# start with proteomics data
sorted_biomolecule_names_dict = {k: v for k, v in sorted(global_names_dict['combined'].items(), key=lambda item: item[1])}
#available_biomolecules = proteomics_biomolecule_names_dict.values()
#available_biomolecules = proteomics_df.columns[:proteomics_quant_range].sort_values().tolist()
default_biomolecule = list(sorted_biomolecule_names_dict.keys())[0]

plotly_config = {"toImageButtonOptions":{'format':'svg',
                'filename': 'dash_plot'},
                "displaylogo": False}

# # NOTE: Need to add transcriptomics data here
dataset = 'combined'
combined_omics_df = df_dict[dataset]
quant_value_range = quant_value_range_dict[dataset]

available_datasets = ['Combined']
# start at COVID status
clinical_metadata_options = combined_omics_df.columns[quant_value_range+4:].sort_values().tolist()
clinical_metadata_options.remove("Days_admitted_before_enrollment")
clinical_metadata_options.remove("Plasma_or_CRRT_before_enrollment")
clinical_metadata_options.append('COVID')
biomolecule_options = [{'label': value, 'value': key} for key, value in sorted_biomolecule_names_dict.items() if key in combined_omics_df.columns.to_list()]

control_panel = dbc.Card(
    [
        dbc.CardHeader("CONTROL PANEL",
                            style={"background-color":"#5bc0de",
                                        "font-weight":"bold",
                                        "font-size":"large"}),
        dbc.CardBody(
            [html.P("Select Clinical Measurement", className="card-title", style={"font-weight":"bold"}),
            dcc.Dropdown(
                id='clinical_measurement-lr',
                options=[{'label': i, 'value': i} for i in clinical_metadata_options],
                # only passing in quant value columns
                value=clinical_metadata_options[0]),
            html.Hr(),
            html.P("Select Groups", className="card-title", style={"font-weight":"bold"}),
            dcc.Checklist(
                id='group-checklist-lr',
                options=[
                    {'label': ' COVID ICU', 'value': 'COVID_ICU'},
                    {'label': ' COVID NONICU', 'value': 'COVID_NONICU'},
                    {'label': ' NONCOVID ICU', 'value': 'NONCOVID_ICU'},
                    {'label': ' NONCOVID NONICU', 'value': 'NONCOVID_NONICU'}
                ],
                value=['COVID_ICU', 'COVID_NONICU', 'NONCOVID_ICU', 'NONCOVID_NONICU'],
                labelStyle={'display': 'inline-block'}
            ),
            html.Hr(),
            html.P("Select Biomolecule", className="card-title", style={"font-weight":"bold"}),

            # NOTE: This is dcc object not dbc
            dcc.Dropdown(
                id='biomolecule_id-lr',
                # label maps to biomolecule name, value to biomolecule_id
                options=biomolecule_options,
                # only passing in quant value columns
                value=default_biomolecule,
                className="dropdown-item p-0"),

                ])
    ])

first_card = dbc.Card(
    [
        dbc.CardHeader("BIOMOLECULE SCATTER PLOT",
                            style={"background-color":"#5bc0de",
                                        "font-weight":"bold",
                                        "font-size":"large"}),
        dbc.CardBody(dcc.Graph(id='scatter-lr',
        config=plotly_config))
    ])


#app.layout = dbc.Container([
layout = dbc.Container([

    navbar,

    html.Hr(),

    dbc.Row(dbc.Col(html.H1("COVID-19 Multi-Omics Data Dashboard"), width={"size": 6, "offset": 3})),

    html.Hr(),

    dbc.Row(
        [dbc.Col(
        dbc.Nav(
    [
        html.H3("TYPE OF ANALYSIS", style={"font-weight":"bold", "color":"black"}),

        dbc.NavItem(dbc.NavLink(html.Span("PCA"),
            disabled=False,
            href="pca",
            style={"color":"grey"})),



        dbc.NavItem(dbc.NavLink("Linear Regression", active=True, href="linear_regression", style={"background-color":"grey"})),

        dbc.NavItem(dbc.NavLink(

            html.Span(
                    "Differential Expression",
                    id="tooltip-lr",
                    style={"cursor": "pointer", "color":"grey"},
                ),disabled=False, href="differential_expression")),

        dbc.NavItem(dbc.NavLink(
            html.Span(
                    "Clustergrammer",
                    id="tooltip-cg",
                    style={"cursor":"pointer", "color":"grey"},
                ),disabled=False, href="clustergrammer")),


        html.Hr(),
        control_panel
    ],
    vertical="md",
    pills=True
        ), md=2, className="mb-3"),

        dbc.Col(first_card, md=7),
        ],

        className="mb-3"),


], fluid=True, style={"height": "100vh"})


@app.callback(
    Output('scatter-lr', 'figure'),
    [Input('biomolecule_id-lr', 'value'),
    Input('group-checklist-lr','value'),
    Input('clinical_measurement-lr', 'value')])
def update_biomolecule_scatter(biomolecule_id, groups, clinical_measurement):

    biomolecule_name = global_names_dict["combined"][biomolecule_id]
    fig = correlation_scatter(combined_omics_df, biomolecule_id, groups,
        biomolecule_name, clinical_measurement)

    return fig