util.py

import math
import numpy as np
import pandas as pd
import geopandas as gpd
import pandas_bokeh
from pandas_bokeh.geoplot import convert_geoDataFrame_to_patches

from functools import partial
from datetime import datetime, timedelta
from bokeh.io import curdoc
from bokeh.layouts import layout, gridplot, column, row
from bokeh.models import Button, Toggle, CategoricalColorMapper, ColumnDataSource, TableColumn, DataTable, HoverTool, Label, SingleIntervalTicker, Slider, Spacer, GlyphRenderer, DatetimeTickFormatter, DateRangeSlider, DataRange1d, Range1d, DateSlider, LinearColorMapper, Div, CustomJS, Band, HTMLTemplateFormatter, StringFormatter, Scatter, Slope
from bokeh.palettes import Inferno256, Magma256, Turbo256, Plasma256, Cividis256, Viridis256, OrRd
from bokeh.plotting import figure
from bokeh.events import DocumentReady

# import configuration variables
from config import *

# utility functions


# log the current time and the difference from a reference time
def print_time( reference_time, label ):

    current_time = datetime.now()
    delta = current_time - reference_time
    delta = delta - timedelta(microseconds=delta.microseconds)

    print(current_time, 'elapsed time at', label, delta)


# because spaces are gone once a string is inserted into HTML
def make_html_integer( value ):

    value_with_commas = format(value, ',d')
    value_html = value_with_commas.replace(',', '&nbsp;')

    return value_html


def make_interval_str( title, value, value_l, value_r ):

    str_interval = title + str(value) + ' (' + str(value_l) + '  -  ' + str(value_r) + ')'

    return str_interval


def make_plot( name, title, range, x_axis_type='auto', height=PLOT_HEIGHT, width=PLOT_WIDTH ):
    return figure(plot_height=height, plot_width=width, title=title, tools=PLOT_TOOLS, x_range=[0, range], name=name, x_axis_type=x_axis_type)


# because there are several ways to achieve this, let's encapsulate
def make_data_source( datax, datay ):
    return ColumnDataSource(data=dict(x=datax, y=datay))


def make_data_source2( datax, datay, datay2 ):
    return ColumnDataSource(data=dict(x=datax, y=datay, y2=datay2))


# receives a list of lists on for y0, y1, y2, ....
def make_data_source_multi( datax, datay_list ):

    length = len(datay_list)
    data_dict = {}
    data_dict['x'] = datax
    for j in range(0, length):
        key = 'y' + str(j)
        data_dict[key] = datay_list[j]

    return data_dict


# create a data source based on dates
def make_data_source_dates( dates, datay, datay2=None ):

    if datay2:
        df = pd.DataFrame(data={ 'x': dates, 'y': datay, 'y2': datay2 }, columns=['x', 'y', 'y2'])
    else:
        df = pd.DataFrame(data={ 'x': dates, 'y': datay }, columns=['x', 'y'])

    return ColumnDataSource(df)


# receives a list of lists on for y0, y1, y2, ....
def make_data_source_multi_dates( datax, datay_list ):

    length = len(datay_list)
    columns = []
    data_dict = {}
    data_dict['x'] = datax
    columns.append('x')
    for j in range(0, length):
        key = 'y' + str(j)
        data_dict[key] = datay_list[j]
        columns.append(key)

    df = pd.DataFrame(data=data_dict, columns=columns)

    return ColumnDataSource(df)


# generate the labels for the age stratified plots
def make_age_labels( nr_labels, nr_series ):

    labels = []
    for j in range(0, nr_series):
        if j == nr_series - 1:
            labels.append('>= ' + str( j * 10 ) )
        else:
            labels.append(str( j * 10 ) + '-' + str( (j  + 1) * 10 - 1 ))

    return labels


# create the map plot, using Pandas-Bokeh
def make_map_plot( data ):

    hover_string = [ ('County', '@NAME_2'), ('Incidence', '@incidence'), ]

    # According to the docs the colormap parameter of the plot_bokeh function:
    # "Defines the colors to plot. Can be either a list of colors or the name of a Bokeh color palette"

    # because our original palette has the colors in the wrong direction
    # and because of this https://github.com/bokeh/bokeh/issues/7297
    # we can't just invert the colormap_range or we loose the legend on the color bar
    # so we we are forced to reverse the palette manually

    colormap = reverse_palette(OrRd)[MAP_INCIDENCE_RESOLUTION]

    # we now create a plot based on a geodataframe to which an incidence column has been added
    # https://patrikhlobil.github.io/Pandas-Bokeh/#geoplots
    aplot = data.plot_bokeh( name='themap', title=MAP_TITLE, category='incidence', hovertool=True, colormap=colormap, colormap_range=(MAP_INCIDENCE_MIN, MAP_INCIDENCE_MAX),
                             hovertool_string=hover_string, legend=False, figsize=(MAP_WIDTH, MAP_HEIGHT), simplify_shapes=MAP_RESOLUTION, tile_provider=MAP_TILE_PROVIDER)

    # we are selecting the plot by name and then getting the data_source
    # the name was given in the invocatino of plot_bokeh
    data_source = aplot.select(name='themap').data_source

    # remove the interactions and decorations
    aplot.toolbar.active_drag   = None
    aplot.toolbar.active_scroll = None
    aplot.toolbar.active_tap    = None

    aplot.toolbar_location = None

    aplot.xaxis.visible = False
    aplot.yaxis.visible = False

    return aplot, data_source


# create table with summary statistics
def make_stats_table( width, height, alignment ):

    # we initialize this with dummy values
    stats_data   = pd.DataFrame( { 'updated': '01-01-1970', 'sum_new': [0], 'sum_cv19_deaths': [0], 'sum_total_deaths': [0], 'sum_avg_deaths': [0], 'excess_deaths': [0], 'excess_deaths_pct': [0] } )
    stats_source = ColumnDataSource(stats_data)

    # the colors match the plot titles and the main plot lines, respectively
    formatter_template  = """<div style="font-size: 188%; font-weight: bold; padding-top: 7px; color: #4d4d4d" ><%= value %></div>"""
    formatter_template2 = """<div style="font-size: 188%; font-weight: bold; padding-top: 7px; color: #b3b3b3" ><%= value %></div>"""

    my_formatter  = HTMLTemplateFormatter(template=formatter_template )
    my_formatter2 = HTMLTemplateFormatter(template=formatter_template2)

    base_colum_width = 105

    # we will define a per column width
    # reference: http://docs.bokeh.org/en/latest/docs/reference/models/widgets.tables.html#bokeh.models.widgets.tables.TableColumn

    stats_columns = [
        TableColumn(field="sum_new",           title="Cases" ,                  formatter=my_formatter,  sortable=False, width=base_colum_width      ),
        TableColumn(field="sum_cv19_deaths",   title="Covid19 deaths",          formatter=my_formatter,  sortable=False, width=base_colum_width      ),
        TableColumn(field="sum_total_deaths",  title="Overall deaths",          formatter=my_formatter,  sortable=False, width=base_colum_width      ),
        TableColumn(field="sum_avg_deaths",    title="Overal deaths 2015-2019", formatter=my_formatter,  sortable=False, width=base_colum_width + 30 ),
        TableColumn(field="excess_deaths",     title="Excess deaths",           formatter=my_formatter,  sortable=False, width=base_colum_width      ),
        TableColumn(field="excess_deaths_pct", title="Excess deaths %",         formatter=my_formatter,  sortable=False, width=base_colum_width      ),
        TableColumn(field="updated",           title="Updated at",              formatter=my_formatter2, sortable=False, width=base_colum_width + 15 ),
    ]

    # the autosize_mode is not useful here because different columns need different widths, the alignement is in relation to the parent widget
    # http://docs.bokeh.org/en/latest/docs/reference/models/widgets.tables.html#bokeh.models.widgets.tables.DataTable
    stats_table = DataTable(source=stats_source, columns=stats_columns, index_position=None, selectable=False, autosize_mode='none', width=width, height=height, align=alignment, row_height=35)

    return stats_table


# create table for overall mortality statistics
def make_mortality_stats_table( width, height, alignment ):

    # we initialize this with dummy values
    dummy_column = [ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 ]
    index_column = [ '<1', '1-4', '5-14', '15-24', '25-34', '35-44', '45-54', '55-64', '65-74', '75-84', '>85', 'all ages', 'all ages *' ]

    stats_data   = pd.DataFrame( { 'age_group': index_column, 'sum_total_deaths': dummy_column, 'sum_avg_deaths': dummy_column, 'excess_deaths': dummy_column, 'excess_deaths_pct': dummy_column } )

    stats_source = ColumnDataSource(stats_data)

    # the colors match the plot titles and the main plot lines, respectively
    formatter_template_index = """<div style="font-size: 130%; font-family: 'Courier New', monospace; font-weight: bold;   padding-top: 3px; height: 15px; color: #4d4d4d" ><%= value %></div>"""
    formatter_template       = """<div style="font-size: 130%; font-family: 'Courier New', monospace; font-weight: normal; padding-top: 3px; height: 15px; color: #4d4d4d" ><%= value %></div>"""

    my_formatter_index = HTMLTemplateFormatter(template=formatter_template_index )
    my_formatter       = HTMLTemplateFormatter(template=formatter_template )

    base_colum_width = 70

    # we will define a per column width
    # reference: http://docs.bokeh.org/en/latest/docs/reference/models/widgets.tables.html#bokeh.models.widgets.tables.TableColumn

    stats_columns = [
        TableColumn(field="age_group",         title="Age Group",                formatter=my_formatter_index,  sortable=False, width=base_colum_width + 25 ),
        TableColumn(field="sum_total_deaths",  title="Overall deaths",           formatter=my_formatter,        sortable=False, width=base_colum_width + 10 ),
        TableColumn(field="sum_avg_deaths",    title="Overall deaths 2015-2019", formatter=my_formatter,        sortable=False, width=base_colum_width + 70 ),
        TableColumn(field="excess_deaths",     title="Excess deaths",            formatter=my_formatter,        sortable=False, width=base_colum_width + 10 ),
        TableColumn(field="excess_deaths_pct", title="Excess deaths %",          formatter=my_formatter,        sortable=False, width=base_colum_width + 20 ),
    ]

    # the autosize_mode is not useful here because different columns need different widths, the alignement is in relation to the parent widget
    # http://docs.bokeh.org/en/latest/docs/reference/models/widgets.tables.html#bokeh.models.widgets.tables.DataTable
    stats_table = DataTable(source=stats_source, columns=stats_columns, index_position=None, selectable=False, autosize_mode='none', width=width, height=height, align=alignment)

    return stats_table


# set properties common to all the plots based on linear xaxis
def set_plot_details( aplot, xlabel=PLOT_X_LABEL, ylabel=PLOT_Y_LABEL, xtooltip_format="@x{0}", ytooltip_format="@y{0}", tooltip_mode='vline', show_x_label=True, show_y_label=False, ylabel2=PLOT_Y_LABEL, ytooltip_format2=None, tooltip_line=None, show_x_axis=True, ylabel3=PLOT_Y_LABEL, ytooltip_format3=None ):
    aplot.toolbar.active_drag    = None
    aplot.toolbar.active_scroll  = None
    aplot.toolbar.active_tap     = None

    # add the hover tool
    tooltip_attachment = 'left'
    tooltip_list = [ (xlabel, xtooltip_format), (ylabel, ytooltip_format), ]
    tooltip_formatters = {'@x': 'datetime'}

    # check if we have a second line for tooltips
    if ytooltip_format2:
        tooltip_list.append( (ylabel2, ytooltip_format2) )

    # same for 3rd
    if ytooltip_format3:
        tooltip_list.append( (ylabel3, ytooltip_format3) )

    # we pass a single render to anchor the tooltip to a specific line
    if tooltip_line:
        ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, formatters=tooltip_formatters, renderers=[ tooltip_line ])
    else:
        rlist  = aplot.select(dict(type=GlyphRenderer))
        if len(rlist) > 0:
            ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, formatters=tooltip_formatters, renderers=[ rlist[0] ])
        else:
            # this only happens if we have a plot that has not lines yet, but it is here to prevent a crash
            print('This is probably a plot with no line')
            ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, )

    ahover.point_policy = 'snap_to_data'
    ahover.line_policy  = 'nearest'
    aplot.add_tools(ahover)
    aplot.toolbar.active_inspect = ahover

    # control placement / visibility of toolbar
    aplot.toolbar_location = None

    # labels
    if show_x_label:
        aplot.xaxis.axis_label = xlabel
    if show_y_label:
        aplot.yaxis.axis_label = ylabel

    aplot.xaxis.visible = show_x_axis


# set properties common to all the plots with multiple lines
def set_plot_details_multi( aplot, xlabel=PLOT_X_LABEL, ylabels=[], xtooltip_format="@x{0}", tooltip_mode='vline', tooltip_line=None, extra_precision=False, show_x_axis=False, extra_tooltip=None ):
    aplot.toolbar.active_drag    = None
    aplot.toolbar.active_scroll  = None
    aplot.toolbar.active_tap     = None

    # add the hover tool
    tooltip_attachment = 'left'
    tooltip_list = [ (xlabel, xtooltip_format) ]
    tooltip_formatters = {'@x': 'datetime'}

    nr_series = len(ylabels)
    j = 0
    for label in ylabels:
        if extra_precision:
            ytooltip_format = "@y" + str(j) + "{0.00}"
        else:
            ytooltip_format = "@y" + str(j) + "{0}"
        j = j + 1
        tooltip_list.append( (label, ytooltip_format ) )

    # add an extra custom tooltip for a custom line, if passed as an argument
    if extra_tooltip is not None:
        tooltip_list.append(extra_tooltip)

    # we pass a single render to anchor the tooltip to a specific line
    if tooltip_line:
        ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, formatters=tooltip_formatters, renderers=[ tooltip_line ])
    else:
        rlist  = aplot.select(dict(type=GlyphRenderer))
        if len(rlist) > 0:
            ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, formatters=tooltip_formatters, renderers=[ rlist[0] ])
        else:
            # this only happens if we have a plot that has not lines yet, but it is here to prevent a crash
            print('This is probably a plot with no line')
            ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, )

    ahover.point_policy = 'snap_to_data'
    ahover.line_policy  = 'nearest'
    aplot.add_tools(ahover)
    aplot.toolbar.active_inspect = ahover

    # control placement / visibility of toolbar
    aplot.toolbar_location = None

    # labels
    aplot.xaxis.visible = show_x_axis

    aplot.legend.location = 'top_left'
    aplot.legend.click_policy = 'mute'

    aplot.legend.label_text_font_size = PLOT_LEGEND_FONT_SIZE
    aplot.legend.spacing = PLOT_LEGEND_SPACING


def set_plot_date_details( aplot, date_series, length, asource=None ):

    aplot.xaxis.formatter = DatetimeTickFormatter( months=["%b %Y"], years=["%b %Y"], )

    aplot.x_range.start = date_series[0]          - datetime(1970, 1, 1).date()
    aplot.x_range.end   = date_series[length - 1] - datetime(1970, 1, 1).date()

    aplot.xaxis.major_label_orientation = math.pi / 4

    if asource:
        y_min, y_max = get_y_limits(asource, date_series[0 + DATE_IGNORE], date_series[length - 1])
        range_delta = y_max * PLOT_RANGE_FACTOR

        # this thing alone prevents an interference from toggling the visibility of clines
        # and the scale of the plots; comment this line and you will see :-)
        # reference:
        # https://discourse.bokeh.org/t/autoscaling-of-axis-range-with-streaming-multiline-plot-with-bokeh-server/1284/2?u=comperem
        aplot.y_range = Range1d(y_min - range_delta , y_max + range_delta)


# this function iterates across the several resolutions (color sets) of a bokeh palette
# and reverses their order
def reverse_palette( original_palette ):

    palette = { }
    base_value = 3
    for item in original_palette.items():
        # print(base_value, item)
        palette[base_value] = item[1][::-1]
        base_value = base_value + 1

    return palette


# calculate a value range adapted to the values present in the date range
def get_y_limits( source, date_i, date_f ):

    # calculate indexes in the y data
    y_i = np.where( source.data['x'] == date_i )[0][0]
    y_f = np.where( source.data['x'] == date_f )[0][0]

    # get min and max iterating over the plot series
    y_max_list = []
    y_min_list = []
    for s in source.data:
        # x and index are also sries in the data source, let's ignore them
        if s == 'x' or s == 'index':
            continue
        y_max_list.append( np.nanmax(source.data[s][y_i:y_f]) )
        y_min_list.append( np.nanmin(source.data[s][y_i:y_f]) )

    # return the minimum of the minimuns for the interval, same for maximum
    return min(y_min_list), max(y_max_list)


# make specific plot for mortality comparisons
def make_mortality_plot( data_dates, data_total_deaths, data_avg_deaths, data_avg_deaths_inf, data_avg_deaths_sup, days, name ):

    df = pd.DataFrame(data={ 'x': data_dates, 'y': data_total_deaths, 'y2': data_avg_deaths, 'y3': data_avg_deaths_inf, 'y4': data_avg_deaths_sup }, columns=['x', 'y', 'y2', 'y3', 'y4'])
    data_source = ColumnDataSource(df)

    aplot = figure(plot_height=PLOT_HEIGHT4, plot_width=PLOT_WIDTH4, title='Overall deaths by age group', tools=PLOT_TOOLS, x_range=[0, days], name=name, x_axis_type='auto', sizing_mode='scale_width', max_width=PLOT_WIDTH4 )

    aplot_line1 = aplot.line('x', 'y',  source=data_source, line_width=PLOT_LINE_WIDTH, line_alpha=PLOT_LINE_ALPHA, line_color=PLOT_LINE_COLOR, legend_label='Current' )
    aplot_line2 = aplot.line('x', 'y2', source=data_source, line_width=1, line_alpha=PLOT_LINE_ALPHA, line_color=PLOT_LINE_COLOR_REFERENCE, legend_label='2015-2019 ± SD' )

    my_band = Band(base='x', lower='y3', upper='y4', source=data_source, level='underlay', line_width=1, line_color=PLOT_LINE_COLOR_HIGHLIGHT, fill_color=PLOT_LINE_COLOR_HIGHLIGHT, line_alpha=PLOT_LINE_ALPHA, fill_alpha=PLOT_LINE_ALPHA)
    aplot.add_layout(my_band)

    aplot.legend.location = 'top_left'

    set_plot_details(aplot, 'Date', 'Current', '@x{%F}', '@y{0}', 'vline', False, False, '2015-2019', "@y2{0} (@y3{0}-@y4{0})", aplot_line1)
    set_plot_date_details(aplot, data_dates, days, data_source)

    aplot.legend.label_text_font_size = PLOT_LEGEND_FONT_SIZE

    return aplot


# the index of the first non-NaN element
def get_nn_index( data ):

    index = 0
    for element in data:
        if not math.isnan(element):
            # print('first non NaN is index', index)
            return index
        else:
            index = index + 1

    print('did not found any non-NaN element')
    return -1


# return lists without leading NaNs
def get_clean_data( data ):

    index = get_nn_index(data)

    return data[index:]


# creates a correlation description string
def make_correlation_str( slope, intercept, r_value ):

    m = round(slope, 2)
    b = round(intercept, 2)
    R = round(r_value, 2)

    corr_str = 'm=' + str(m) + ' b=' + str(b) + ' R=' + str(R)

    return corr_str


# returns the correlation paramters
def get_correlation_data( datax, datay ):

    fit_results = np.polyfit(datax, datay, 1, full=True)

    slope     = fit_results[0][0]
    intercept = fit_results[0][1]

    # this is not necessary, stays here for reference
    # y_fit = [slope*i + intercept  for i in datax]

    # Pearson correlation coefficient
    # https://realpython.com/numpy-scipy-pandas-correlation-python/#example-numpy-correlation-calculation
    r_value   = np.corrcoef( datax, datay )[0, 1]

    # print('slope', slope, 'intercept', intercept, 'coeff', r_value)

    return slope, intercept, r_value


# make specific correlation plot
def make_correlation_plot( datax, datay, xlabel, ylabel, height, width ):

    source_aplot = make_data_source(datax, datay)

    aplot = make_plot('Deaths correlation', PLOT_CORRELATION_TITLE, max(datax), 'auto', height, width)

    # we want the same limits in both axis
    max_value = max(max(datay), max(datax) )
    margin = 10

    aplot.x_range = Range1d(0, max_value + margin)
    aplot.y_range = Range1d(0, max_value + margin)

    glyph = Scatter(x='x', y='y', marker='dot', size=20, line_color=PLOT_LINE_COLOR, line_alpha=PLOT_LINE_ALPHA)
    aplot.add_glyph(source_aplot, glyph)

    aplot.xaxis.axis_label = xlabel
    aplot.yaxis.axis_label = ylabel

    aplot.toolbar.active_drag   = None
    aplot.toolbar.active_scroll = None
    aplot.toolbar.active_tap    = None
    aplot.toolbar_location      = None

    slope, intercept, r_value = get_correlation_data(datax, datay)

    regression_line = Slope(gradient=slope, y_intercept=intercept, line_color=PLOT_LINE_COLOR_REFERENCE, line_alpha=PLOT_LINE_ALPHA, line_width=PLOT_LINE_WIDTH, line_dash='dashed')

    # this is the y=x line, for reference
    comparison_line = Slope(gradient=1, y_intercept=0, line_color='gray', line_alpha=0.6, line_width=1 )

    aplot.add_layout(regression_line)
    aplot.add_layout(comparison_line)

    label_str = make_correlation_str(slope, intercept, r_value)

    regression_label = Label(x=190, y=5, text=label_str)

    aplot.add_layout(regression_label)

    return aplot, source_aplot, r_value, regression_line, regression_label


# make specific CFR/CHR plots
def make_vacc_risk_plot(data_vacc, type_str, group_str):

    # extract sub dataframes by matching group_str and the date column (called 'data')
    sub_df = data_vacc.loc[:, data_vacc.columns.to_series().str.endswith( (group_str, 'data') )  ]

    date_list = sub_df['data'].values
    aplot = figure(plot_height=PLOT_HEIGHT6, plot_width=PLOT_WIDTH6, title=type_str, x_range=date_list )

    aplot.toolbar.active_drag    = None
    aplot.toolbar.active_scroll  = None
    aplot.toolbar.active_tap     = None
    aplot.toolbar_location       = None

    aplot.xaxis.major_label_orientation = math.pi / 4

    asource = ColumnDataSource(sub_df)

    y_line1 = 'outros_'       + group_str
    y_line2 = 'vac_completa_' + group_str
    y_line3 = 'vac_reforco_'  + group_str
    y_line4 = 'vac_reforco2_' + group_str

    y_line1_legend = 'None / incomplete'
    y_line2_legend = 'Complete'
    y_line3_legend = 'Booster'
    y_line4_legend = 'Booster2'

    line1 = aplot.line(x='data', y=y_line1, source=asource, line_width=PLOT_LINE_WIDTH, line_alpha=PLOT_LINE_ALPHA,  line_color=PLOT_LINE_COLOR,           legend_label=y_line1_legend )
    line2 = aplot.line(x='data', y=y_line2, source=asource, line_width=PLOT_LINE_WIDTH, line_alpha=PLOT_LINE_ALPHA,  line_color=PLOT_LINE_COLOR_HIGHLIGHT, legend_label=y_line2_legend )
    line3 = aplot.line(x='data', y=y_line3, source=asource, line_width=PLOT_LINE_WIDTH, line_alpha=PLOT_LINE_ALPHA,  line_color=PLOT_LINE_COLOR_REFERENCE, legend_label=y_line3_legend )
    line4 = aplot.line(x='data', y=y_line4, source=asource, line_width=PLOT_LINE_WIDTH, line_alpha=PLOT_LINE_ALPHA2, line_color=PLOT_LINE_COLOR_REFERENCE, legend_label=y_line4_legend )

    # prepare the tooltips
    # we need to use the dataframe column names which depend on the group_str parameter
    tooltip_list = [ ('date', '@data'),
                     (y_line1_legend, '@' + y_line1 + '{0.0}%'),
                     (y_line2_legend, '@' + y_line2 + '{0.0}%'),
                     (y_line3_legend, '@' + y_line3 + '{0.0}%'),
                     (y_line4_legend, '@' + y_line4 + '{0.0}%'), ]
    tooltip_formatters = {}

    # the line to which the tooltip attaches and other details
    tooltip_line = line1
    tooltip_attachment = 'right'
    tooltip_mode = 'vline'

    # add the hover tool
    ahover = HoverTool(tooltips=tooltip_list, mode=tooltip_mode, attachment=tooltip_attachment, formatters=tooltip_formatters, renderers=[ tooltip_line ])

    ahover.point_policy = 'snap_to_data'
    ahover.line_policy = 'nearest'
    aplot.add_tools(ahover)
    aplot.toolbar.active_inspect = ahover

    return aplot