app.py


# Run this app with `python app.py` and
# visit http://127.0.0.1:8050/ in your web browser.

# imports
from datetime import timedelta

import numpy as np
import plotly.graph_objects as go
from dash import Dash, Input, Output, ctx, dcc, html, no_update
from epispot import comps, models, pre
from epispot.analysis import normalize
from epispot.estimates.getters import query
from pandas import DataFrame, to_datetime

import core

# create app
app = Dash(__name__)
app.title = 'COVID-19 Notebook'
server = app.server


# get data
source = 'cumulative'
df = core.find.data(source=source)
counties = core.get.counties()


# globals
index = 0
data = [df.p_cases, df.p_deaths, df.death_rate]
labels = ['p_cases', 'p_deaths', 'death_rate']
zmax = [0.5, 0.01, 0.035]
center = {'lat': 37.0902, 'lon': -95.7129}
zoom = 3


# forecasting options
forecast = {
    'extent': 'None',
    'model': 'SIR',
    'behavior': 'Average',
}
params = {
    'gamma_inf': query(
        ('SARS-CoV-2', 'Mehra et al. 2020', 'gamma')
    )(0),
    'delay': 7,
    'undercount': 0.2,
    'low': {
        'R_0': 1.5,
        'delta': 0.1,
        'alpha': 0.0075,
        'rho': 0.07,
    },
    'average': {
        'R_0': 2.25,
        'delta': 0.2,
        'alpha': 0.01,
        'rho': 0.1,
    },
    'high': {
        'R_0': 3,
        'delta': 0.3,
        'alpha': 0.015,
        'rho': 0.14,
    }
}


# create main figure
fig = go.Figure(go.Choroplethmapbox(
    geojson=counties,
    locations=df.fips,
    z=df.p_cases,
    zmin=0, zmax=0.5,
    colorscale=[
        [0, '#adffc2'],
        [0.5, '#ff9382'],
        [1, '#c90061']
    ],
    marker_line_width=0,
    marker_opacity=0.75,
    text=df.county + ', ' + df.state
    + '<br>cases: '
    + np.round(100 * df.p_cases, 1).astype(str) + '%'
    + '<br>deaths: '
    + np.round(100 * df.p_deaths, 1).astype(str) + '%'
    + '<br>fatality rate: '
    + np.round(100 * df.death_rate, 1).astype(str) + '%',
    hoverinfo='text',
))
fig.update_layout(
    mapbox_style='open-street-map',
    mapbox_zoom=3,
    mapbox_center={'lat': 37.0902, 'lon': -95.7129},
)
fig.update_layout(
    margin={ 'r': 0, 't': 0, 'l': 0, 'b': 0 }
)


# helper funcs
def update_source(value):
    """Change data sources to fit selection"""
    global df, source, index, data, labels, zmax

    # match selection
    match value:
        case 'Cumulative': source = 'cumulative'
        case 'Current': source = 'rolling'

    # update source
    df = core.find.data(source=source)

    # configure parameters
    data = [df.p_cases, df.p_deaths, df.death_rate]
    labels = ['p_cases', 'p_deaths', 'death_rate']

    if source == 'rolling':

        data = [
            df['cases_avg_per_100k'],
            df['deaths_avg_per_100k'],
            df['death_rate']
        ]
        labels = [
            'cases_avg_per_100k',
            'deaths_avg_per_100k',
            'death_rate'
        ]

    zmax = [0.5, 0.01, 0.035]
    if source == 'rolling': zmax = [75, 1, 0.035]

    # redraw figure
    fig.update_traces(
        locations=df.fips,
        z=data[index],
        zmax=zmax[index],
        text=df.county + ', ' + df.state
        + '<br>cases: '
        + np.round(data[0], 1).astype(str) + '/100k'
        + '<br>deaths: '
        + np.round(data[1], 1).astype(str) + '/100k'
        + '<br>fatality rate: '
        + np.round(100 * data[2], 1).astype(str) + '%',
    )
    fig.update_layout(
        mapbox_style='open-street-map',
        mapbox_zoom=zoom,
        mapbox_center=center,
    )

    return fig

def change_map_view(value):
    """Change map center and zoom depending on selection"""
    global center, zoom

    # default center, zoom
    center = {'lat': 37.0902, 'lon': -95.7129}
    zoom = 3

    # match selection
    match value:
        case 'Contiguous U.S.':
            pass
        case 'Alaska':
            center = {'lat': 63.3850, 'lon': -152.2683}
            zoom = 2
        case 'Hawaii':
            center = {'lat': 19.8983, 'lon': -155.5822}
            zoom = 5
        case 'Puerto Rico & the U.S. Virgin Islands':
            center = {'lat': 18.4389, 'lon': -66.0079}
            zoom = 6.5
        case 'Northern Mariana Islands':
            center = {'lat': 15.2, 'lon': 145.75}
            zoom = 7

    # update layout
    fig.update_layout(
        mapbox_style='open-street-map',
        mapbox_zoom=zoom,
        mapbox_center=center,
    )

    return fig

def change_choropleth(value):
    """Change choropleth data to match selection"""
    global index

    # get appropriate data source
    index = 0

    # match selection
    match value:
        case 'Cases': pass
        case 'Fatalities': index = 1
        case 'Fatality Rate': index = 2

    # change choropleth data
    fig.update_traces(
        z=data[index],
        zmax=zmax[index],
    )
    fig.update_layout(
        mapbox_style='open-street-map',
        mapbox_zoom=zoom,
        mapbox_center=center,
    )

    return fig

def generate_info(src, map, choro):
    """Generate info text based on selection"""

    # defaults
    grouping = 'cumulative totals'
    subdivision = 'counties'
    region = 'the contiguous U.S'
    data = 'cases'
    format = 'as percentage of total population'

    # match data source
    match src:
        case 'Cumulative': pass
        case 'Current':
            grouping = 'rolling averages from the past 7 days'
            format = 'per 100k people'

    # match map view
    match map:
        case 'Contiguous U.S.': pass
        case 'Alaska':
            subdivision = 'boroughs and census-designated areas'
            region = 'Alaska'
        case 'Hawaii':
            region = 'Hawaii'
        case 'Puerto Rico & the U.S. Virgin Islands':
            subdivision = 'municipalities'
            region = 'Puerto Rico & the U.S. Virgin Islands'
        case 'Northern Mariana Islands':
            subdivision = 'municipalities'
            region = 'the Northern Mariana Islands'

    # match choropleth data
    match choro:
        case 'Cases': pass
        case 'Fatalities': data = 'deaths'
        case 'Fatality Rate':
            data = 'fatality rate'
            format = 'as percentage of total cases'

    # generate info text
    text = [
        f'Viewing {grouping} for all {subdivision} in {region}.',
        html.Br(), f'Showing {data} {format}.',
    ]

    return text

def format_data(col, index):
    """Format data column for plotly display"""

    label = labels[index]
    match label:
        case 'p_cases' | 'p_deaths' | 'death_rate':
            return np.round(col * 100, 1).astype(str) + '%'
        case 'cases_avg_per_100k' | 'deaths_avg_per_100k':
            return np.round(col, 1).astype(str) + '/100k'

def format_date(col):
    """Format date column (as list of strings) for plotly display"""

    # convert string of format '%Y-%m-%d' to date object
    date = to_datetime(col)
    return date.dt.strftime('%-m/%-d')

def get_forecast_data(fips):
    """Get forecast data for a specific FIPS code"""
    data = core.find.historical(fips, source='cumulative')
    return data.drop(columns=['county', 'state', 'fips'])

def to_series(predictions, dates, n, source):
    """Turn predictions into formatted series and rearrange"""

    def frame(cols, names, dates):
        """Put columns into data frames and format"""
        out = []
        for i, col in enumerate(cols):
            # match scaling
            if source == 'rolling' and index in [0, 1]:
                out.append(DataFrame({
                    'date': dates[:len(col)],
                    names[i]: 100 * col / n
                }))
            else:
                out.append(DataFrame({
                    'date': dates[:len(col)],
                    names[i]: col / n
                }))

        return out

    if source == 'historical':
        active, recovered = frame(
            [predictions[0], predictions[2]],
            ['active', 'recovered'],
            dates
        )
        return active, recovered

    last = to_datetime(dates.tail(1).values[0]) \
        - timedelta(days=params['delay'])
    future = [
        last + timedelta(days=i + 1)
        for i in range(14 + params['delay'])
    ]
    predictions = np.array(predictions)

    match forecast['model']:

        case 'SIR':
            infected, removed = frame(
                [predictions[:, 1], predictions[:, 2]],
                ['infected (predicted)', 'removed (predicted)'],
                future
            )
            return infected, removed

        case 'SEIR':
            exposed, infected, removed = frame(
                [predictions[:, 1], predictions[:, 2], predictions[:, 3]],
                [
                    'exposed (predicted)', 'infected (predicted)',
                    'removed (predicted)'
                ],
                future
            )
            return exposed, infected, removed

        case 'SIRD':
            infected, recovered, dead = frame(
                [predictions[:, 1], predictions[:, 2], predictions[:, 3]],
                [
                    'infected (predicted)', 'recovered (predicted)',
                    'dead (predicted)'
                ],
                future
            )
            return infected, recovered, dead

        case 'SEIRD':
            exposed, infected, recovered, dead = frame(
                [
                    predictions[:, 1],
                    predictions[:, 2],
                    predictions[:, 3],
                    predictions[:, 4]
                ],
                [
                    'exposed (predicted)', 'infected (predicted)',
                    'recovered (predicted)', 'dead (predicted)'
                ],
                future
            )
            return exposed, infected, recovered, dead

def create_seird(r_0, gamma, n, alpha, rho, delta):
    """Create and returned a pre-compiled SEIRD model"""

    # compile compartments
    susceptible = comps.Susceptible(r_0, gamma, n)
    exposed = comps.Exposed()
    infected = comps.Infected()
    recovered = comps.Recovered()
    dead = comps.Dead()

    # compile parameters
    matrix = np.empty((5, 5), dtype=tuple)
    matrix.fill((1.0, 1.0))  # default probability and rate

    matrix[1][2] = (1, delta)

    recovery_rate = (gamma - alpha * rho) / (1 - alpha)
    matrix[2][3] = (1 - alpha, recovery_rate)  # I => R
    matrix[2][4] = (alpha, rho)  # I => D

    # compile model
    seird_model = models.Model(n)
    seird_model.add(susceptible, [1], matrix[0])
    seird_model.add(exposed, [2], matrix[1])
    seird_model.add(infected, [3, 4], matrix[2])
    seird_model.add(recovered, [], matrix[3])
    seird_model.add(dead, [], matrix[4])
    seird_model.compile()

    return seird_model

def forecast_historical(data):
    """Generate historical forecasts of other compartments"""

    # process available data
    total_infected = normalize.count(
        data['cases'], params['undercount']
    )
    total_fatalities = normalize.count(
        data['deaths'], params['undercount']
    )
    infected_deltas = normalize.deltas(total_infected)
    fatalities_deltas = normalize.deltas(total_fatalities)

    # normalize data
    infected = normalize.active(
        infected_deltas, round(1 / params['gamma_inf']), delay=params['delay']
    )
    infected_deltas = normalize.shift(
        infected_deltas, params['delay']
    )
    fatalities_deltas = normalize.shift(
        fatalities_deltas, params['delay']
    )

    # extract missing data
    fatalities_deltas = normalize.bound(
        infected, infected_deltas, fatalities_deltas
    )
    recovered_deltas = normalize.recovered(
        infected, infected_deltas, fatalities_deltas
    )

    # get cumulative data
    fatalities = normalize.cumulative(fatalities_deltas)
    recovered = normalize.cumulative(recovered_deltas)

    return infected, fatalities, recovered

def forecast_all(historical, n):
    """Generate predictive forecasts for all compartments"""

    # process available data
    infected, fatalities, recovered = historical
    infected = infected[-1]
    fatalities = fatalities[-1]
    recovered = recovered[-1]
    remaining = n - (infected + fatalities + recovered)

    # get parameter set
    param_set = None
    match forecast['behavior']:
        case 'Low Transmission': param_set = params['low']
        case 'Average': param_set = params['average']
        case 'High Transmission': param_set = params['high']

    # initialize model
    model = None
    state = None

    match forecast['model']:
        case 'SIR':
            model = pre.sir(param_set['R_0'], params['gamma_inf'], n)
            state = [remaining, infected, fatalities + recovered]
        case 'SEIR':
            model = pre.seir(
                param_set['R_0'], params['gamma_inf'], n,
                param_set['delta']
            )
            state = [remaining, 0, infected, fatalities + recovered]
        case 'SIRD':
            model = pre.sird(
                param_set['R_0'], params['gamma_inf'], n,
                param_set['alpha'], param_set['rho']
            )
            state = [remaining, infected, recovered, fatalities]
        case 'SEIRD':
            model = create_seird(
                param_set['R_0'], params['gamma_inf'], n,
                param_set['alpha'], param_set['rho'],
                param_set['delta']
            )
            state = [remaining, 0, infected, recovered, fatalities]

    # get predictions
    predicted = model.integrate(
        range(14 + params['delay']),
        starting_state=np.array(state)
    )
    return predicted

def add_to_figure(fig, series):
    """Add one or more series to the figure"""

    def scale(k):
        # match scaling
        if source == 'rolling' and index in [0, 1]:
            return k * 100
        return k

    format_scale = lambda k: np.round(k * 100, 1).astype(str) + '%'

    for col in series:
        fig.add_trace(go.Scatter(
            x=col['date'],
            y=scale(col.iloc[:, 1]),
            name=col.columns[1],
            mode='lines+markers',
            text=format_date(col['date']) + ': '
            + format_scale(col.iloc[:, 1]),
            hoverinfo='text',
        ))

def run_forecast(fig, fips):
    """"Run a forecast and add its results to the county graph"""
    data = get_forecast_data(fips)
    population = data['population'].values[0]

    historical = forecast_historical(data)
    series = to_series(historical, data['date'], population, 'historical')
    add_to_figure(fig, series)

    if forecast['extent'] == 'Historical':
        return fig

    predictions = forecast_all(historical, population)
    series = to_series(predictions, data['date'], population, 'all')
    add_to_figure(fig, series)
    return fig


# callbacks
@app.callback(
    [
        Output('graph', 'figure'),
        Output('info', 'children'),
    ],
    [
        Input('source-dropdown', 'value'),
        Input('map-dropdown', 'value'),
        Input('choropleth-dropdown', 'value')
    ]
)
def update_figure(src_drop, map_drop, choro_drop):
    """Responsible for all updates to the main figure"""

    ids = list(ctx.triggered_prop_ids.values())
    if len(ids) == 0: return no_update
    id = ids[0]

    out = no_update

    match id:
        case 'source-dropdown':
            out = update_source(src_drop)
        case 'map-dropdown':
            out = change_map_view(map_drop)
        case 'choropleth-dropdown':
            out = change_choropleth(choro_drop)

    info_out = generate_info(src_drop, map_drop, choro_drop)
    return out, info_out

@app.callback(
    [
        Output('county-info-name', 'children'),
        Output('county-graph-container', 'children')
    ],
    Input('graph', 'clickData')
)
def update_county(click_data):
    """Responsible for updating the county popup"""

    # get info
    if click_data is None:
        return no_update

    fips = click_data['points'][0]['location']

    # process county data
    data = core.find.historical(fips, source=source)
    name = data['county'].values[0] + ', ' + data['state'].values[0]

    # generate figure
    fig = go.Figure(go.Scatter(
        x=data['date'],
        y=data[labels[index]],
        name='data',
        mode='lines+markers',
        text=format_date(data['date']) + ': '
        + format_data(data[labels[index]], index),
        hoverinfo='text',
    ))
    fig.update_layout(
        template='simple_white',
    )

    # add forecasts
    if forecast['extent'] != 'None':
        run_forecast(fig, fips)

    return name, dcc.Graph(figure=fig, id='county-graph')

@app.callback(
    Output('void-forecast', 'children'),
    [
        Input('forecast-extent', 'value'),
        Input('forecast-model', 'value'),
        Input('forecast-behavior', 'value')
    ]
)
def update_forecast(extent, model, behavior):
    """Modify forecasting parameters"""
    global forecast
    forecast = {
        'extent': extent,
        'model': model,
        'behavior': behavior,
    }
    return no_update


# create app layout
app.layout = html.Div(children=[
    html.H1(children='COVID-19 Notebook'),
    html.Div(children='''
        An interactive notebook for examining trends in COVID-19 cases
    ''', id='subtitle'),
    dcc.Dropdown(
        ['Cumulative', 'Current'], 'Cumulative',
        id='source-dropdown'
    ),
    dcc.Dropdown([
        'Contiguous U.S.', 'Alaska', 'Hawaii',
        'Puerto Rico & the U.S. Virgin Islands',
        'Northern Mariana Islands'
    ], 'Contiguous U.S.', id='map-dropdown'),
    dcc.Dropdown(
        ['Cases', 'Fatalities', 'Fatality Rate'], 'Cases',
        id='choropleth-dropdown'
    ),
    html.Div(children=[
        dcc.Graph(figure=fig, id='graph'),
        html.Div(children=[
            html.H2(children='No county selected.', id='county-info-name'),
            html.Div(children=[], id='county-graph-container'),
        ], id='county-info'),
    ], id='graph-container'),
    html.H2(children='Forecasting Options'),
    html.Div(children=[
        html.Div(children=[
            html.H3(children='Extent'),
            dcc.RadioItems(
                ['None', 'Historical', 'Comprehensive'],
                'None', id='forecast-extent'
            ),
        ], className='forecasting-option'),
        html.Div(children=[
            html.H3(children='Model'),
            dcc.RadioItems(
                ['SIR', 'SIRD', 'SEIR', 'SEIRD'],
                'SIR', id='forecast-model'
            ),
        ], className='forecasting-option'),
        html.Div(children=[
            html.H3(children='Behavior'),
            dcc.RadioItems(
                ['Low Transmission', 'Average', 'High Transmission'],
                'Average', id='forecast-behavior'
            ),
        ], className='forecasting-option'),
    ], id='forecasting-options'),
    html.Div(children=[
        'Viewing cumulative totals for all counties in the contiguous U.S.',
        html.Br(), 'Showing cases as percentage of total population.'
    ], id='info'),
    dcc.Markdown(
        children='Data from *The New York Times*, based on reports from state '
        + 'and local health agencies.  \n'
        + 'See also: '
        + '<https://www.nytimes.com/interactive/2020/us/coronavirus-us-cases'
        + '.html>.  \n'
        + f'Last updated {core.get.last_update()}, at midnight UTC.',
        id='footer'
    ),
    # for callbacks w/ no output
    html.Div(id='void-forecast', style={ 'display': 'none' })
])


# run app
if __name__ == '__main__':
    app.run_server(debug=True)