import pandas as pd
import numpy as np


def _read_glooko_csv(csv_path, columns):
    """
    Load a single CSV export and convert its ``time`` column to datetimes.

    Args:
        csv_path (str): location of the CSV file to read.
        columns (list of str): names assigned to the columns, in file order. Must
        contain ``"time"``.

    Returns:
        pandas df whose columns are ``columns`` and whose ``time`` column has been
        passed through ``pd.to_datetime``.
    """
    # header=1 together with names= drops the first two lines of the file: line 0 is
    # skipped and line 1 is the file's own header row, which `columns` replaces.
    frame = pd.read_csv(csv_path, header=1, names=columns)
    frame["time"] = pd.to_datetime(frame["time"])
    return frame


def read_all(data_folder):
    """
    Read all of the data and return a series of pandas data frames

    Example usage:
    df_cgm, df_bolus, df_basal, df_insulin = read_all(r"data")

    Args:
        data_folder (str or path-like): path to the root folder containing all the data
        files. The file names and structure should be left exactly as they were in the
        initial download from Glooko (``cgm_data.csv`` in the root, the three insulin
        files inside an ``Insulin data`` sub-folder).

    Returns:
        A 4-element tuple

        - **df_cgm** (pandas df): pandas dataframe containing CGM time series data
          (columns: time, bg, sn_cgm)
        - **df_bolus** (pandas df): Bolus data
        - **df_basal** (pandas df): Basal data
        - **df_insulin** (pandas df): Insulin totals data
          (columns: time, total_bolus, total_insulin, total_basal, sn_omni)

    """
    # Paths are built by formatting rather than `+` so that a pathlib.Path root works
    # too; for a plain string the resulting path is identical to concatenation.
    insulin_folder = f"{data_folder}/Insulin data"

    df_cgm_data = _read_glooko_csv(
        f"{data_folder}/cgm_data.csv",
        ["time", "bg", "sn_cgm"],
    )

    df_bolus_data = _read_glooko_csv(
        f"{insulin_folder}/bolus_data.csv",
        [
            "time", "insulin_type", "bg_input", "carbs_input", "carb_ratio",
            "insulin_delivered", "initial_delivery", "extended_delivery", "sn_omni",
        ],
    )

    df_basal_data = _read_glooko_csv(
        f"{insulin_folder}/basal_data.csv",
        [
            "time", "insulin_type", "duration", "percentage", "rate",
            "insulin_delivered", "sn_omni",
        ],
    )

    df_insulin_data = _read_glooko_csv(
        f"{insulin_folder}/insulin_data.csv",
        ["time", "total_bolus", "total_insulin", "total_basal", "sn_omni"],
    )

    return df_cgm_data, df_bolus_data, df_basal_data, df_insulin_data


# Read every export found under ../data into its own dataframe
df_cgm, df_bolus, df_basal, df_insulin = read_all("../data")


# Derived bolus columns:
#   carb_correction    = carbs_input / carb_ratio
#   insulin_correction = insulin_delivered - carb_correction
# NOTE(review): presumably this splits each bolus into the part covering carbs and the
# part correcting blood glucose -- confirm against the Glooko column definitions.
df_bolus["carb_correction"] = df_bolus["carbs_input"] / df_bolus["carb_ratio"]
df_bolus["insulin_correction"] = df_bolus["insulin_delivered"].sub(df_bolus["carb_correction"])


import hvplot.pandas #noqa
import holoviews as hv

# Use holoviews to quickly plot CGM data: a light gray line through the readings, the
# individual readings as scatter points, and a dashed black horizontal line at 150.
(
    df_cgm.hvplot.line(
        x='time',
        y='bg',
        ylabel='Blood glucose (mg/dL)',
        xlabel='Time',
        height=500,
        width=620,
        color='lightgray',
    )
    * df_cgm.hvplot.scatter(x='time', y='bg')
    * hv.HLine(150).opts(color='k', line_dash='dashed', line_width=2.0)
)


import matplotlib.pyplot as plt
%matplotlib widget

# Start by taking the first difference of the CGM data (change between consecutive
# samples). A leading 0 is prepended so there is one value per dataframe row.
# NOTE(review): this is a per-sample difference and is not divided by the time step,
# so it only approximates a derivative if samples are evenly spaced -- confirm.
df_cgm["d_bg"] = [0] + np.diff(df_cgm["bg"]).tolist()

# Two stacked panels sharing the time axis: raw CGM on top, its difference below
fig, ax = plt.subplots(2, 1, sharex=True)

ax[0].plot(df_cgm["time"], df_cgm["bg"], '.-')
ax[0].grid(True)
ax[0].set_title('CGM data')
# Label previously lacked its closing parenthesis
ax[0].set_ylabel('Blood glucose (mg/dL)')

ax[1].plot(df_cgm["time"], df_cgm["d_bg"], '.-')
# Fixed y-range; differences outside +/-50 are clipped from view
ax[1].set_ylim([-50, 50])
ax[1].grid(True)
ax[1].set_title('d_cgm/d_t')
ax[1].set_ylabel('BG (mg/dL) - difference')

fig.tight_layout()


from scipy.ndimage import gaussian_filter1d

# Smooth the CGM signal with a 1-D Gaussian kernel (sigma = 4 samples).
# scipy.ndimage allocates its output with the input's dtype, so an integer `bg` column
# would yield an integer-quantized result; cast to float first to keep the smoothing.
g_filter = gaussian_filter1d(df_cgm['bg'].to_numpy(dtype=float), sigma=4)
df_cgm['bg_filt'] = g_filter

# Overlay the original and the filtered signal
fig2, ax2 = plt.subplots(1, 1)
ax2.plot(df_cgm['time'], df_cgm['bg'], 'k', label='Original')
ax2.plot(df_cgm['time'], g_filter, '--r', label='Filtered')
# NOTE(review): these limits look like matplotlib date numbers (days since 1970-01-01
# under the default epoch), i.e. roughly 2023-02-14 02:22 to 2023-02-15 00:30 -- confirm.
ax2.set_xlim([19402.098437682915, 19403.020563564292])
ax2.set_title('Gaussian filtering')
ax2.set_ylabel('Blood glucose (mg/dL)')
ax2.set_xlabel('Time')
ax2.tick_params(rotation=45)
ax2.grid()

fig2.tight_layout()


# Re-calculate the diff data using the filtered CGM data. This overwrites the "d_bg"
# column; a leading 0 keeps one value per dataframe row.
df_cgm["d_bg"] = [0] + np.diff(df_cgm["bg_filt"]).tolist()

# Plot filtered CGM data (top) with its differenced data (bottom) on a shared time axis
fig3, ax3 = plt.subplots(2, 1, sharex=True)

ax3[0].plot(df_cgm["time"], df_cgm["bg_filt"], '.-')
ax3[0].grid(True)
ax3[0].set_title('CGM data')
# Label previously lacked its closing parenthesis
ax3[0].set_ylabel('Blood glucose (mg/dL)')

ax3[1].plot(df_cgm["time"], df_cgm["d_bg"], '.-')
# Red zero line across the full time span of the data, marking where the difference
# changes sign
ax3[1].plot([df_cgm["time"].min(), df_cgm["time"].max()], [0, 0], 'r-', linewidth=2)
ax3[1].set_ylim([-10, 10])
ax3[1].grid(True)
ax3[1].set_title('d_cgm/d_t')
ax3[1].set_ylabel('BG (mg/dL) - difference')
# NOTE(review): these limits look like matplotlib date numbers (days since 1970-01-01
# under the default epoch), i.e. roughly 2023-02-14 02:22 to 2023-02-15 00:30 -- confirm.
ax3[1].set_xlim([19402.098437682915, 19403.020563564292])
ax3[1].tick_params(rotation=45)

fig3.tight_layout()

Part 1: Getting started

Bolus data

Extracting key information