# run.py

print("Importing modules...")
import os           # Used for analyzing file paths and directories
import csv          # Needed to read in and write out data
import argparse     # Used to parse optional command-line arguments
import warnings
warnings.simplefilter(action='ignore', category=FutureWarning)
# https://stackoverflow.com/questions/15777951/how-to-suppress-pandas-future-warning
# https://stackoverflow.com/questions/18603270/progress-indicator-during-pandas-operations
# https://pypi.org/project/tqdm/#pandas-integration
# Gives warning if tqdm version <4.33.0. Ignore.
# https://github.com/tqdm/tqdm/issues/780
import pandas as pd # Series and DataFrame structures
import numpy as np
import traceback
import time
from datetime import datetime
import getpass
from PIL import Image
import hashlib
import glob
from tqdm import tqdm
import copy
import re

try:
    import matplotlib
    matplotlib.use("Agg") # no UI backend for use w/ WSL
    # https://stackoverflow.com/questions/43397162/show-matplotlib-plots-and-other-gui-in-ubuntu-wsl1-wsl2
    import matplotlib.pyplot as plt # Needed for optional data plotting.
    PLOT_LIB_PRESENT = True
except ImportError:
    PLOT_LIB_PRESENT = False
# https://stackoverflow.com/questions/3496592/conditional-import-of-modules-in-python
print("...done\n")

# global constants: directory structure
RAW_INCA_DIR = "./raw_data/INCA"
RAW_EDAQ_DIR = "./raw_data/eDAQ"
SYNC_DIR = "./sync_data"
PLOT_DIR = "./figs"
# Find Desktop path, default destination for log files.
# The Windows user profile is reached through the /mnt/c mount point, and the
# Desktop folder is looked up inside the profile's single "OneDrive - ..."
# folder.
username = getpass.getuser()
# https://stackoverflow.com/questions/842059/is-there-a-portable-way-to-get-the-current-username-in-python
home = os.path.join("/mnt/c/Users", username)
# Keep the full list of matches so the count can actually be validated.
onedrives = [folder for folder in os.listdir(home) if "OneDrive -" in folder]
if not onedrives:
    raise RuntimeError("Found no 'OneDrive -' folder in %s. "
                                        "Cannot locate Desktop." % home)
if len(onedrives) > 1:
    raise RuntimeError("Found more than one OneDrive folder. "
                                                    "Unhandled exception")
onedrive = onedrives[0]
LOG_DIR = os.path.join(home, onedrive, "Desktop")


# global constants: raw data format
# Channel lists give the column order assumed when reading each raw file.
INCA_CHANNELS = ["time", "pedal_sw", "engine_spd", "throttle"]
# eDAQ layout for files up to "05".
EDAQ_CHANNELS_5 = ["time", "pedal_v", "gnd_speed", "pedal_sw"]
# eDAQ layout for files "06" and later (torque-meter channels).
EDAQ_CHANNELS_6 = [
    "time",
    "pedal_v",
    "wtq_RR", "wspd_RR",
    "wtq_LR", "wspd_LR",
    "pedal_sw",
]
# Unit string for each channel name.
CHANNEL_UNITS = dict(
    time="s",
    pedal_sw="off/on",
    pedal_v="V",
    engine_spd="rpm",
    gnd_speed="mph",
    throttle="deg",
    wtq_RR="ft-lb",
    wtq_LR="ft-lb",
    wspd_RR="rpm",
    wspd_LR="rpm",
)
# Number of non-data rows at the top of each raw file type.
INCA_HEADER_HT = 5
EDAQ_HEADER_HT = 1
SAMPLING_FREQ = 100 # Hz

# global constants: vehicle parameters
ROLLING_RADIUS_FACTOR = 0.965
TIRE_DIAM_IN = 18 # inches
AXLE_RATIO = 11.47
GEARBOX_RATIO = 1.95

# Some case-specific constants stored in class definitions


class FilenameError(Exception):
    """Raised when a raw data filename is malformed, missing or duplicated."""

class DataReadError(Exception):
    """Raised when raw data is missing or not laid out as expected."""

class DataSyncError(Exception):
    """Raised when the INCA and eDAQ data sets can't be synchronized."""


class RunGroup(object):
    """Represents a collection of runs from the raw_data directory.

    Constructing a RunGroup builds one run object per file found in the raw
    INCA directory (no data is read at that point) and then processes either
    all of them or a single run chosen at a prompt.
    """
    def __init__(self, process_all=False, start_run=False, verbose=False, warn=False):
        """Build the run dictionary and process the selected runs.

        process_all -- process every run instead of prompting for one.
        start_run   -- with process_all, skip runs whose label sorts before
                       this four-digit run number.
        verbose     -- passed through to each run object.
        warn        -- passed through to each run object.
        """
        self.verbosity = verbose
        self.warn_p = warn
        # create SingleRun object for each run but don't read in data yet.
        self.build_run_dict()
        self.process_runs(process_all, start_run)

    def build_run_dict(self):
        """Creates dictionary with an entry for each INCA run in raw_data dir.

        Files whose run object can't be created (FilenameError) are reported
        and skipped. When two files share a run label, the user is asked which
        one to keep.

        Raises DataReadError if the raw INCA directory does not exist.
        """
        if not os.path.exists(RAW_INCA_DIR):
            raise DataReadError("No raw INCA directory found. Put data in this "
                                                "folder: %s" % RAW_INCA_DIR)
        INCA_files = sorted(os.listdir(RAW_INCA_DIR))
        self.run_dict = {}

        for file in INCA_files:
            if os.path.isdir(os.path.join(RAW_INCA_DIR, file)):
                continue # ignore any directories found

            # Filenames mentioning decel/downhill get a DownhillRun; all
            # others are treated as steady-state runs.
            if re.search(r"(dec{1,2}el)|(downhill)", file, flags=re.IGNORECASE):
                create_run = self.create_downhill_run
            else:
                create_run = self.create_ss_run

            try:
                ThisRun = create_run(file)
            except FilenameError as exception_text:
                print(exception_text)
                # https://stackoverflow.com/questions/1483429/how-to-print-an-exception-in-python
                input("\nRun creation failed with file '%s'.\n"
                      "Press Enter to skip this run." % (file))
                print("") # blank line
                continue # Don't add to run dict

            run_label = ThisRun.get_run_label()
            if run_label in self.run_dict:
                # catch duplicate run nums.
                dup_answ = ""
                while dup_answ not in ["1", "2"]:
                    print("More than one run %s found in %s:\n"
                        "\t1. '%s'\n"
                        "\t2. '%s'\n"
                        "Which one should be used as run %s? (1/2)"
                        % (run_label, RAW_INCA_DIR,
                         self.run_dict[run_label].get_inca_filename(),
                         file, run_label))
                    dup_answ = input("> ")
                if dup_answ == "1":
                    # Keep the run that is already stored.
                    print("") # blank line
                    continue
                # Answer "2": fall through and overwrite the stored run.

            self.run_dict[run_label] = ThisRun

    def create_ss_run(self, filename):
        """Return an SSRun for the given file in the raw INCA directory."""
        return SSRun(os.path.join(RAW_INCA_DIR, filename), self.verbosity,
                                                                    self.warn_p)

    def create_downhill_run(self, filename):
        """Return a DownhillRun for the given file in the raw INCA directory."""
        return DownhillRun(os.path.join(RAW_INCA_DIR, filename), self.verbosity,
                                                                    self.warn_p)

    def _run_stage(self, stage_name, action):
        """Apply action to each run in runs_to_process, dropping failed runs.

        Any exception raised by action is logged through the run's own
        log_exception(stage_name), and that run is removed from
        runs_to_process so it isn't included in later calls.
        """
        bad_runs = []
        for run_num, RunObj in self.runs_to_process.items():
            try:
                action(RunObj)
            except Exception:
                RunObj.log_exception(stage_name)
                # Stage for removal; can't pop while iterating the dict.
                bad_runs.append(run_num)
        for bad_run in bad_runs:
            self.runs_to_process.pop(bad_run)

    def process_runs(self, process_all, start_run):
        """Processes runs in RunGroup.

        Raises FilenameError if start_run is given but matches no INCA run.
        """
        if process_all:
            # automatically process all INCA runs (below)
            self.runs_to_process = dict(self.run_dict) # avoids aliasing.
            if start_run:
                if not self.validate_run_num(start_run):
                    raise FilenameError("Cannot find matching INCA run for -s "
                                                    "argument %s" % start_run)
                # Remove earlier runs
                self.runs_to_process = {
                    run_num: RunObj
                    for run_num, RunObj in self.run_dict.items()
                    if run_num >= start_run
                }
        else:
            # prompt user for single run to process.
            OnlyRun = self.prompt_for_run()
            self.runs_to_process = {OnlyRun.get_run_label(): OnlyRun}

        self._run_stage("Processing", lambda RunObj: RunObj.process_data())

    def plot_runs(self, overwrite=False, desc_str=""):
        """Creates plots for all runs in RunGroup."""
        if not self.runs_to_process:
            print("\nNo valid runs to plot.\n")
            return
        self._run_stage("Plotting",
                        lambda RunObj: RunObj.plot_data(overwrite, desc_str))

    def export_runs(self, overwrite=False, desc_str=""):
        """Exports data for all runs in RunGroup."""
        if not self.runs_to_process:
            print("\nNo valid runs to export.\n")
            return
        self._run_stage("Exporting",
                        lambda RunObj: RunObj.export_data(overwrite, desc_str))

    def prompt_for_run(self):
        """Prompts user for what run to process
        Returns SingleRun object."""
        run_prompt = "Enter run num (four digits)\n> "
        target_run_num = input(run_prompt)

        # Keep asking until the entry matches a known run.
        while not self.validate_run_num(target_run_num):
            target_run_num = input(run_prompt)

        return self.run_dict.get(target_run_num)

    def validate_run_num(self, target_run_num):
        """Check if user-entered run num is valid.

        Returns True when the four-character entry is a key of run_dict;
        otherwise prints the reason and returns False.
        """
        if len(target_run_num) != 4:
            print("Need a four-digit number.")
            return False
        if target_run_num in self.run_dict:
            return True
        print("No valid INCA file found matching that run.")
        return False


class SingleRun(object):
    """Represents a single run from the raw_data directory.
    No data is read in until read_data() method called.
    """
    def __init__(self, INCA_path, verbose=False, warn_prompt=False):
        """Store the INCA file location and parse the run number from its name.

        No run data is read here.
        """
        # Output object that stores and prints this run's output info.
        self.Doc = Output(verbose, warn_prompt)
        self.INCA_path = INCA_path
        self.INCA_filename = os.path.basename(INCA_path)
        self.parse_run_num()

    def parse_run_num(self):
        run_num_match = re.findall(r"(?<=_)\d{4}(?=-)", self.INCA_filename):
        if run_num_match:
            self.run_label = run_num_match[0]
        else:
            raise FilenameError("INCA filename '%s' not in correct format.\n"
            "Expected format is "
            "'[pretext]_[four-digit run num][anything else]'.\nNeed the four "
            "characters that follow the first underscore to be run num."
                                                        % self.INCA_filename)

        # Create metadata string to document in outuput file
        self.meta_str = "INCA_file: '%s' | " % self.INCA_filename

    def process_data(self):
        """Run all processing methods on run data."""
        self.read_data()
        self.sync_data()
        if int(self.run_label[:2]) > 5:
            # only needed for torque-meter runs.
            self.combine_torque()
            self.calc_gnd_speed()
        self.abridge_data()
        self.add_math_channels()

    def find_edaq_path(self, eDAQ_file_num):
        """Locate path to eDAQ file corresponding to INCA run num.

        Scans the raw eDAQ directory for the one file whose two-digit file
        number equals eDAQ_file_num, stores its path in self.eDAQ_path and
        appends its name to self.meta_str.

        Raises DataReadError if the raw eDAQ directory does not exist.
        Raises FilenameError if any file in the directory has a malformed
        name, if more than one file matches, or if none does.
        """
        if not os.path.exists(RAW_EDAQ_DIR):
            raise DataReadError("No raw eDAQ directory found. Put data in this "
                                                "folder: %s" % RAW_EDAQ_DIR)

        target_edaq_run = None # stays None until a matching file is found.
        for eDAQ_run in os.listdir(RAW_EDAQ_DIR):
            if os.path.isdir(os.path.join(RAW_EDAQ_DIR, eDAQ_run)):
                continue # ignore any directories found

            run_num_match = re.findall(r"(?<=\d{8}_)\d{2}(?=[.-])", eDAQ_run)
            if not run_num_match:
                # Every file is checked, not just the target, so one bad
                # filename stops the lookup for all runs.
                raise FilenameError("eDAQ filename '%s' not in correct format."
                "\nExpected format is "
                "'[pretext]_[two-digit file num][anything else]'.\nNeed the "
                "two characters that follow the first underscore to be file "
                "num.\nThis will cause problems with successive runs until you "
                "fix the filename or remove the offending file from %s."
                                                    % (eDAQ_run, RAW_EDAQ_DIR))

            if run_num_match[0] != eDAQ_file_num:
                continue
            if target_edaq_run is not None:
                # Duplicate found
                raise FilenameError("More than one eDAQ file with '%s' "
                    "designation. This will cause problems with successive runs "
                    "until you remove duplicate files from %s."
                                            % (eDAQ_file_num, RAW_EDAQ_DIR))
            target_edaq_run = eDAQ_run

        if target_edaq_run is None:
            raise FilenameError("No eDAQ file found for run %s" % eDAQ_file_num)

        self.eDAQ_path = os.path.join(RAW_EDAQ_DIR, target_edaq_run)
        # Document in metadata string for later file output.
        self.meta_str += "eDAQ file: '%s' | " % target_edaq_run

    def read_data(self):
        """Read in both INCA and eDAQ data from raw_data directory.

        Populates self.raw_inca_df and self.raw_edaq_df, each indexed by its
        raw time channel, and sets self.edaq_channels to the channel list that
        matches the eDAQ file number (first two digits of the run label).

        Raises DataReadError if the INCA channel-name row doesn't match the
        assumed channel order, or if this run's columns can't be found in the
        eDAQ header row.
        """
        eDAQ_file_num = self.run_label[0:2]
        self.find_edaq_path(eDAQ_file_num)

        # Channels changed starting with eDAQ file "06"
        if int(eDAQ_file_num) > 5:
            self.edaq_channels = EDAQ_CHANNELS_6
        else:
            self.edaq_channels = EDAQ_CHANNELS_5

        # Read in both eDAQ and INCA data for specific run.
        # Read INCA data first
        # File automatically closed at end of "with/as" block.
        with open(self.INCA_path, "r") as inca_ascii_file:
            self.Doc.print("\nReading INCA data from %s" % self.INCA_path)
            INCA_file_in = csv.reader(inca_ascii_file, delimiter="\t")
            # https://stackoverflow.com/questions/7856296/parsing-csv-tab-delimited-txt-file-with-python

            raw_inca_dict = {channel: [] for channel in INCA_CHANNELS}

            # Text expected inside the INCA file's own name for each channel.
            expected_inca_names = (("time", "time"),
                                   ("pedal_sw", "SW_PEDAL"),
                                   ("engine_spd", "NE"),
                                   ("throttle", "THagr"))

            for i, INCA_row in enumerate(INCA_file_in):
                if i == 2:
                    # Row 2 holds the channel names.
                    # print channel order for debugging
                    self.Doc.print("\tINCA file channels:\t" +
                                "  -  ".join([str(c) for c in INCA_row]), True)
                    self.Doc.print("\tAssumed channel order:\t" +
                           "  -  ".join([str(c) for c in INCA_CHANNELS]), True)

                    # Explicitly check for improper channel order:
                    if any(inca_name not in INCA_row[INCA_CHANNELS.index(channel)]
                           for channel, inca_name in expected_inca_names):
                        raise DataReadError("Bad channel order in INCA file.")
                    continue
                elif i < INCA_HEADER_HT:
                    # ignore headers
                    continue
                else:
                    for n, channel in enumerate(INCA_CHANNELS):
                        raw_inca_dict[channel].append(float(INCA_row[n]))

        # Convert the dict to a pandas DataFrame for easier manipulation
        # and analysis.
        self.raw_inca_df = pd.DataFrame(data=raw_inca_dict,
                                                    index=raw_inca_dict["time"])
        self.Doc.print("...done")

        self.Doc.print("\nraw_inca_df after reading in data:", True)
        self.Doc.print(self.raw_inca_df.to_string(max_rows=10, max_cols=7,
                                                show_dimensions=True), True)
        self.Doc.print("", True)

        # Now read eDAQ data
        with open(self.eDAQ_path, "r") as edaq_ascii_file:
            self.Doc.print("Reading eDAQ data from %s" % self.eDAQ_path)
            eDAQ_file_in = csv.reader(edaq_ascii_file, delimiter="\t")

            raw_edaq_dict = {channel: [] for channel in self.edaq_channels}

            for j, eDAQ_row in enumerate(eDAQ_file_in):
                if j < EDAQ_HEADER_HT-1:
                    continue

                if j == EDAQ_HEADER_HT-1:
                    # The last header row is a list of channel names.
                    # Converting to int and back to str strips zero padding
                    sub_run_num = int(self.run_label[2:4])
                    edaq_sub_run = "RN_"+str(sub_run_num)

                    # Loop through and find the first channel for this run.
                    # NOTE(review): substring match, so "RN_1" also matches
                    # "RN_10"; relies on the lower-numbered run's columns
                    # coming first - confirm against the eDAQ file layout.
                    for n, col in enumerate(eDAQ_row):
                        if edaq_sub_run in col:
                            edaq_run_start_col = n
                            break
                    else:
                        # Got to end of row and didn't find the run in any
                        # column heading. (for/else, so a match in the final
                        # column is not mistaken for "not found".)
                        raise DataReadError("Can't find %s in any eDAQ file" %
                                                                edaq_sub_run)
                    continue

                if eDAQ_row[edaq_run_start_col+1]:
                    # Need to make sure we haven't reached end of channel strm.
                    # Time vector may keep going past a channel's data, so look
                    # at a run-specific channel to see if the run's ended.

                    # Time is always in 1st column.
                    raw_edaq_dict["time"].append(float(eDAQ_row[0]))
                    for n, channel in enumerate(self.edaq_channels[1:]):
                        # Only add this run's channels to our data list.
                        raw_edaq_dict[channel].append(
                                        float(eDAQ_row[edaq_run_start_col+n]))

        self.raw_edaq_df = pd.DataFrame(data=raw_edaq_dict,
                                                    index=raw_edaq_dict["time"])

        self.Doc.print("...done")
        self.Doc.print("\nraw_edaq_df after reading in data:", True)
        self.Doc.print(self.raw_edaq_df.to_string(max_rows=10, max_cols=7,
                                                    show_dimensions=True), True)

    def sync_data(self):
        # Create copies of the raw dfs to modify and merge.
        inca_df = self.raw_inca_df.copy(deep=True)
        edaq_df = self.raw_edaq_df.copy(deep=True)

        # Convert index from seconds to hundredths of a second
        # It's simple for eDAQ data.
        edaq_df.set_index(pd.Index([int(round(ti * SAMPLING_FREQ))
                                        for ti in edaq_df.index]), inplace=True)
        # https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.set_index.html
        # Offset time series to start at zero.
        self.shift_time_series(edaq_df, zero=True)

        # INCA time increments are slightly off, so error accumulates and
        # can eventually cause issues (alternating 0.00 and 0.02s periods
        # after rounding).
        # Convert INCA to deltas by subtracting each time value from previous
        # one, rounding the delta and adding to the previous (rounded) value.
        # Calculate the rolling difference (delta) between each pair of vals.
        deltas = inca_df["time"].diff()
        # https://stackoverflow.com/questions/13114512/calculating-difference-between-two-rows-in-python-pandas
        deltas[0] = 0 # first val was NaN
        # Round the series then do a cumulative summation:
        deltas = pd.Series([round(ti * SAMPLING_FREQ) for ti in deltas])
        rolling_delt_times = deltas.cumsum()
        # Assign as the index now (converting to int)
        inca_df.set_index(pd.Index(rolling_delt_times.astype(int)), inplace=True)

        # Check if any pedal events exist
        if inca_df.loc[inca_df["pedal_sw"] == 1].empty:
            raise DataSyncError("No pedal event found in INCA data (looking for"
            " value of 1 in pedal switch column). Check input pedal data and "
            "ordering of input file's columns.")
        if edaq_df.loc[edaq_df["pedal_sw"] == 1].empty:
            raise DataSyncError("No pedal event found in eDAQ data (looking for"
            " value of 1 in pedal switch column). Check input pedal data and "
            "ordering of input file's columns.")
        # Find first pedal switch event.
        # https://stackoverflow.com/questions/16683701/in-pandas-how-to-get-the-index-of-a-known-value
        inca_high_start_t = inca_df.loc[inca_df["pedal_sw"] == 1].index[0]
        edaq_high_start_t = edaq_df.loc[edaq_df["pedal_sw"] == 1].index[0]
        self.Doc.print("\nStart times (inca, edaq): %.2fs, %.2fs"
                                    % (inca_high_start_t / SAMPLING_FREQ,
                                       edaq_high_start_t / SAMPLING_FREQ), True)

        # Test first to see if either data set has first pedal event earlier
        # than 1s. If so, that's the new time for both files to align on.
        start_buffer = min([1 * SAMPLING_FREQ, inca_high_start_t,
                                                            edaq_high_start_t])
        self.Doc.print("Start buffer: %0.2fs"
                                           % (start_buffer/SAMPLING_FREQ), True)

        # Shift time values, leaving negative values in early part of file that
        # will be trimmed off below.
        inca_target_t = inca_high_start_t - start_buffer
        edaq_target_t = edaq_high_start_t - start_buffer
        self.shift_time_series(inca_df, offset_val=-inca_target_t)
        self.shift_time_series(edaq_df, offset_val=-edaq_target_t)
        self.Doc.print("First INCA sample shifted to time %0.2fs"
                                    % (inca_df.index[0]/SAMPLING_FREQ), True)
        self.Doc.print("First eDAQ sample shifted to time %0.2fs"
                                    % (edaq_df.index[0]/SAMPLING_FREQ), True)

        # Unify datasets into one DataFrame/
        # Slice out values before t=0 (1s before first pedal press)
        # Truncate file with extra time vals at end. Will not happen during
        # join() because of the "outer" option creating union to catch any
        # time gaps in either dataset (has happened in INCA runs).
        end_time = min(inca_df.index[-1], edaq_df.index[-1])

        # Leave out redundant channels in eDAQ data.
        # Carry over raw time for debugging purposes.
        # The suffix options keep the two DFs' time columns from conflicting.
        self.sync_df = inca_df.loc[0:end_time].join(
               edaq_df.loc[0:end_time, edaq_df.drop(
                                    columns=["pedal_v", "pedal_sw"]).columns],
                         lsuffix="_raw_inca", rsuffix="_raw_edaq", how="outer")

        # https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.join.html#pandas.DataFrame.join
        self.Doc.print("\nsync_df at end of sync:", True)
        self.Doc.print(self.sync_df.to_string(max_rows=10, max_cols=7,
                                                    show_dimensions=True), True)

    def shift_time_series(self, df, zero=False, offset_val=None):
        """Shift the index of df in place.

        If offset_val param specified, add this signed value to all time
        values.
        If zero param passed, offset all such that first val is 0 (any
        offset_val is then ignored).

        Raises DataSyncError if neither zero nor offset_val is given.
        """
        if zero:
            offset_val = -df.index[0]
        elif offset_val is None:
            raise DataSyncError("shift_time_series needs either zero or "
                                                    "offset_val param.")

        df.set_index(df.index + offset_val, inplace=True)

    def combine_torque(self):
        """Sums LR and RR wheel torque readings.
        Used when processing runs 06xx+ that use torque meters."""
        tq_sum = wspd_avg = self.sync_df[["wtq_RR", "wtq_LR"]].sum(axis=1)

        # Remove original columns and replace with combined one.
        self.sync_df.drop(columns=["wtq_RR", "wtq_LR"], inplace=True)
        self.sync_df["rear_wtq_combined"] = tq_sum
        CHANNEL_UNITS["rear_wtq_combined"] = CHANNEL_UNITS["wtq_RR"]

    def calc_gnd_speed(self):
        """Averages LR and RR angular wheel speeds.
        Used when processing runs 06xx+ that use torque meters."""
        wspd_avg = self.sync_df[["wspd_RR", "wspd_LR"]].mean(axis=1)
        # Remove wheel speed channels since we don't want them written to sync file.
        self.sync_df.drop(columns=["wspd_RR", "wspd_LR"], inplace=True)

        # Convert to linear speed.
        tire_circ = np.pi * TIRE_DIAM_IN * ROLLING_RADIUS_FACTOR # inches
        gnd_spd_in_min = wspd_avg * tire_circ

        self.sync_df["gnd_speed"] = gnd_spd_in_min / (5280 * 12/60) # inches/min to mph

    def knit_pedal_gaps(self):
        """Finds any gaps in INCA pedal channel and fills them if pedal signal
        is high before and after gap. Prevents false-negative in abridge
        algo."""
        na_times = self.sync_df["pedal_sw"][self.sync_df["pedal_sw"].isna()]

        if len(na_times) == 0:
            self.Doc.print("\nNo missing INCA times found.")
            return
        else:
            self.Doc.print("\nMissing INCA times (len: %d):" % len(na_times), True)
            self.Doc.print(na_times.to_string(max_rows=10), True)

        # Filter trivial case of gap length 1 to avoid IndexError below.
        if len(na_times) == 1:
            # set variables used in reassignment loop below
            gap_ranges = [na_times.index[0], na_times.index[0]]
        elif len(na_times) > 1:
            # Step through na_times and identify any discontinuities, indicating
            # multiple gaps in the data.
            gap_ranges = []
            current_range = [na_times.index[0]]
            for i, time in enumerate(na_times.index[1:]):
                prev_time = na_times.index[i] # i is behind by one.
                if time - prev_time > 1:
                    current_range.append(prev_time)
                    gap_ranges.append(current_range)
                    # Reset range
                    current_range = [time]
            # Add last value to end of last range
            current_range.append(time)
            gap_ranges.append(current_range)

        self.Doc.print("\nContinuous INCA sample gaps: ")
        for range in gap_ranges:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
                        % (range[0] / SAMPLING_FREQ, range[1] / SAMPLING_FREQ))
        # https://stackoverflow.com/questions/973568/convert-nested-lists-to-string

        for range in gap_ranges:
            # Find time values before and after gap
            pre_time_i = self.sync_df.index.get_loc(range[0]) - 1
            post_time_i = self.sync_df.index.get_loc(range[-1]) + 1
            pre_time = self.sync_df.index[pre_time_i]
            post_time = self.sync_df.index[post_time_i]
            # https://stackoverflow.com/questions/28837633/pandas-get-position-of-a-given-index-in-dataframe
            knit = False
            if (self.sync_df.at[pre_time, "pedal_sw"]
                                 and self.sync_df.at[post_time, "pedal_sw"]):
                # Only need to knit gap if pedal was actuated before gap and
                # still actuated after. Assume no interruption during gap.
                self.Doc.print("\nKnitting pedal event in gap %0.2f -> %0.2f"
                        % (range[0] / SAMPLING_FREQ, range[-1] / SAMPLING_FREQ))

                self.sync_df.at[range[0]:range[1]+1, "pedal_sw"] = 1
                knit = True

                self.Doc.print("\nsync_df after knitting pedal event:", True)
                self.Doc.print(self.sync_df[range[0]-2:range[1]+3].to_string(
                        max_rows=10, max_cols=7, show_dimensions=True), True)

            if not knit:
                self.Doc.print("\nNo pedal events to knit.")

    def abridge_data(self):
        """Do nothing here; SSRun and DownhillRun each have their own version."""
        return None

    def add_math_channels(self):
        """Do nothing here; SSRun and DownhillRun each have their own version."""
        return None

    def add_cvt_ratio(self):
        """Calculate instantaneous CVT ratio and include in abridged dataframe."""
        tire_circ = np.pi * TIRE_DIAM_IN * ROLLING_RADIUS_FACTOR # inches

        if self.get_run_type() == "SSRun":
            gnd_spd_in_min = self.abr_df["gnd_speed"] * 5280 * 12/60 # inches/min
        elif self.get_run_type() == "DownhillRun":
            # Downhill run already has rolling avg available.
            # Using this more stable data to generate CVT ratio for plot.
            gnd_spd_in_min = self.math_df["gs_rolling_avg"] * 5280 * 12/60 # inches/min

        tire_ang_spd = gnd_spd_in_min / tire_circ
        self.math_df["input_shaft_ang_spd"] = tire_ang_spd * AXLE_RATIO * GEARBOX_RATIO
        self.math_df["cvt_ratio"] = (self.abr_df["engine_spd"]
                                        / self.math_df["input_shaft_ang_spd"])

        # # Remove any values that are zero or > 5 (including infinite).
        self.math_df["cvt_ratio_mskd"] = self.math_df["cvt_ratio"].mask(
            (self.math_df["cvt_ratio"] > 5) | (self.math_df["cvt_ratio"] <= 0))

        # Transcribe to main DF for export
        self.abr_df["CVT_ratio_calc"] = self.math_df["cvt_ratio_mskd"].copy()
        CHANNEL_UNITS["CVT_ratio_calc"] = "rpm/rpm"

    def plot_data(self, overwrite=False, description=""):
        """Plot various raw and calculated data from run.
        Child classes add to this."""
        self.overwrite = overwrite
        self.description = description
        self.Doc.print("") # blank line

        self.plot_abridge_compare()
        self.plot_cvt_ratio()

    def plot_abridge_compare(self):
        """Do nothing here; SSRun and DownhillRun each have their own version."""
        return None

    def plot_cvt_ratio(self):
        """Plot calculated CVT ratio along with other data for evaluation.

        Builds three stacked subplots that share one time axis (ground
        speed, engine speed, calculated CVT ratio), hands the figure to
        export_plot("cvt") and then clears it.
        """
        run_type = self.get_run_type()
        is_ss_run = run_type == "SSRun"
        is_downhill_run = run_type == "DownhillRun"

        def mark_average(ax, avg, color, label, below_div, above_div):
            """Draw a horizontal line at avg and label it at the left edge.

            The label goes under the line unless the line sits in the bottom
            fifth of the axis, in which case it goes above. The two divisors
            set the label offset as a fraction of the upper y-limit.
            """
            ax.axhline(avg, color=color, zorder=1)
            y_top = ax.get_ylim()[1]
            if avg > y_top*2/10:
                y_pos = avg - y_top/below_div
            else:
                y_pos = avg + y_top/above_div
            ax.text(ax.get_xlim()[0], y_pos, label, color=color,
                                                        fontsize="x-small")

        # Index values divided by sampling frequency give seconds.
        math_t = self.math_df.index/SAMPLING_FREQ

        # ---- Top subplot: ground speed ----
        ax1 = plt.subplot(311)
        # https://matplotlib.org/3.2.1/api/_as_gen/matplotlib.pyplot.subplot.html

        ax1.plot(math_t, self.math_df["gs_rolling_avg"],
                                            color="lightgrey", zorder=2)
        ax1.plot(math_t, self.math_df["gs_rol_avg_mskd"],
                                            color="r", zorder=3)
        ax1.set_ylabel("Speed (mph)")

        if is_ss_run:
            # plot average for steady-state run (skipped if average is NaN)
            avg = self.math_df.at[0, "SS_gnd_spd_avg"]
            if not np.isnan(avg):
                mark_average(ax1, avg, "lightcoral", str(round(avg, 1)),
                                                below_div=8, above_div=10)
        elif is_downhill_run:
            # Plot slopes for downhill run
            # Restore existing y-axis limits after adding slopes because slopes
            # may extend beyond optimal window limits.
            ylims = ax1.get_ylim()
            color = "lightcoral"
            ax1.plot(math_t, self.math_df["trendlines"], color=color,
                                                zorder=1, scaley=False)
            ax1.set_ylim(ylims)
            ax1.text(ax1.get_xlim()[0], ax1.get_ylim()[1]*9/10,
              " Eng-on: %.2f" % self.math_df.at[0, "accel_avg_calc_eng_on"],
                                                color=color, fontsize="x-small")
            ax1.text(ax1.get_xlim()[0], ax1.get_ylim()[1]*8/10,
              " Eng-off: %.2f" % self.math_df.at[0, "accel_avg_calc_eng_off"],
                                                color=color, fontsize="x-small")

            # https://stackoverflow.com/questions/7386872/make-matplotlib-autoscaling-ignore-some-of-the-plots
            # https://matplotlib.org/3.1.1/gallery/misc/zorder_demo.html
        ax1.set_title("Run %s - CVT Ratio (Abridged Data)" % self.run_label,
                                                                    loc="left")
        plt.setp(ax1.get_xticklabels(), visible=False) # x labels only on bottom

        # ---- Middle subplot: engine speed ----
        ax2 = plt.subplot(312, sharex=ax1)

        if is_ss_run:
            es_rolling_avg = self.math_df["es_rolling_avg"]
            engine_spd_mskd = self.math_df["es_rol_avg_mskd"]
        elif is_downhill_run:
            # No rolling average here: raw engine speed is the grey
            # background trace and the downhill filter picks the highlight.
            es_rolling_avg = self.abr_df["engine_spd"]
            engine_spd_mskd = self.abr_df["engine_spd"].mask(
                                            ~self.math_df["downhill_filter"])

        abr_t = self.abr_df.index/SAMPLING_FREQ
        ax2.plot(abr_t, es_rolling_avg, color="lightgrey", zorder=2)
        ax2.plot(abr_t, engine_spd_mskd, color="tab:blue", zorder=3)
        if is_ss_run:
            # plot average for steady-state run (skipped if average is NaN)
            avg = self.math_df.at[0, "SS_eng_spd_avg"]
            if not np.isnan(avg):
                mark_average(ax2, avg, "lightsteelblue", "%.0f" % avg,
                                                below_div=10, above_div=10)
        ax2.set_ylabel("Engine Speed (rpm)")

        plt.setp(ax2.get_xticklabels(), visible=False) # x labels only on bottom

        # ---- Bottom subplot: CVT ratio ----
        ax3 = plt.subplot(313, sharex=ax1)

        ax3.plot(math_t, self.math_df["cvt_ratio"],
                                            color="lightgrey", zorder=2)
        ax3.plot(math_t, self.math_df["cvt_ratio_mskd"],
                                            color="tab:green", zorder=3)
        ax3.set_ylim([-0.2, 4])
        ax3.set_yticks([0, 1, 2, 3, 4])
        if is_ss_run:
            # plot average for steady-state run (skipped if average is NaN)
            avg = self.math_df.at[0, "SS_cvt_ratio_avg"]
            if not np.isnan(avg):
                mark_average(ax3, avg, "lightgreen",
                             "  " + str(round(avg, 1)),
                             below_div=10, above_div=25)
        ax3.set_ylabel("CVT Ratio Calc")
        ax3.set_xlabel("Time (s)")

        # plt.show() # can't use w/ WSL. Export instead.
        # https://stackoverflow.com/questions/43397162/show-matplotlib-plots-and-other-gui-in-ubuntu-wsl1-wsl2
        self.export_plot("cvt")
        plt.clf()
        # https://stackoverflow.com/questions/8213522/when-to-use-cla-clf-or-close-for-clearing-a-plot-in-matplotlib

    def export_plot(self, type):
        """Exports plot that's already been created with another method.
        Assumes caller method will clear figure afterward.

        type -- short tag for the kind of plot (e.g. "cvt"); used in the
                file name and in the metadata string. The name shadows the
                builtin but is kept so existing callers keep working.

        The figure is saved in PLOT_DIR as
        <run_label>_<type>[-<description>].png and then renamed so that
        "-#" plus the first six hex digits of a SHA-1 over the image's pixel
        data sits before the extension. The same hash text is appended to
        self.meta_str.

        If a figure with the same name (any hash) already exists and
        self.overwrite is false, the user is prompted; answering "n" returns
        without saving anything.
        """
        if self.description:
            fig_filepath = ("%s/%s_%s-%s.png"
                            % (PLOT_DIR, self.run_label, type, self.description))
        else:
            fig_filepath = "%s/%s_%s.png" % (PLOT_DIR, self.run_label, type)
        fig_root, fig_ext = os.path.splitext(fig_filepath)

        short_hash_len = 6
        # Check for existing fig with same filename including description but
        # EXCLUDING hash.
        wildcard_filename = fig_root + "-#" + "?"*short_hash_len + fig_ext
        existing_figs = glob.glob(wildcard_filename)

        if existing_figs and not self.overwrite:
            ow_answer = ""
            while ow_answer.lower() not in ["y", "n"]:
                self.Doc.print("\n%s already exists in figs folder. Overwrite? (Y/N)"
                                        % os.path.basename(wildcard_filename))
                ow_answer = input("> ")
            if ow_answer.lower() == "n":
                # plot will be cleared in caller function.
                return

        # Reached when overwriting (by flag or by answer) or when nothing
        # exists yet. Must manually remove because if figure hash changes,
        # the new file name differs and will not overwrite the original.
        for filepath in existing_figs:
            os.remove(filepath)

        plt.savefig(fig_filepath)
        # Calculate unique hash value (like a fingerprint) to output in CSV's
        # meta_str. Put in img filename too.
        # The context manager closes the image file before it is renamed.
        with Image.open(fig_filepath) as fig_img:
            img_hash = hashlib.sha1(fig_img.tobytes())
        # https://stackoverflow.com/questions/24126596/print-md5-hash-of-an-image-opened-with-pythons-pil
        hash_text = img_hash.hexdigest()[:short_hash_len]
        fig_filepath_hash = fig_root + "-#" + hash_text + fig_ext
        os.rename(fig_filepath, fig_filepath_hash)
        self.Doc.print("Exported plot as %s." % fig_filepath_hash)
        self.meta_str += ("Corresponding %s fig hash: '%s' | "
                                                            % (type, hash_text))

    def export_data(self, overwrite=False, description=""):
        """Output CSV file with synced and abridged data, including some
        calculated channels and aggregated values.

        overwrite   -- when True, an existing output file is replaced without
                       prompting the user.
        description -- optional text appended to the output file name.

        The file is written to SYNC_DIR with this row layout: metadata
        string, channel names, channel units, then one row per sample with
        the time (index / SAMPLING_FREQ, rounded to 2 places) in the first
        column. Units for the added columns are registered in the
        module-level CHANNEL_UNITS dict as a side effect.
        """
        self.overwrite = overwrite
        self.description = description
        run_type = self.get_run_type()

        export_df = self.abr_df.drop(columns=["time_raw_inca", "time_raw_edaq"])
        # https://stackoverflow.com/questions/29763620/how-to-select-all-columns-except-one-column-in-pandas

        if run_type == "SSRun":
            # Pad the columns to not overlap Downhill-specific columns.
            speed_index = export_df.columns.get_loc("gnd_speed")
            export_df.insert(speed_index + 1, "gnd_speed_reg_slope", np.nan)
            CHANNEL_UNITS["gnd_speed_reg_slope"] = CHANNEL_UNITS["gnd_speed"] + "/s"

            # Add some channels from math_df
            export_df["SS_gnd_spd_avg_calc"] = self.math_df["SS_gnd_spd_avg"]
            export_df["SS_eng_spd_avg_calc"] = self.math_df["SS_eng_spd_avg"]
            export_df["SS_cvt_ratio_avg_calc"] = self.math_df["SS_cvt_ratio_avg"]
            CHANNEL_UNITS["SS_gnd_spd_avg_calc"] = CHANNEL_UNITS["gnd_speed"]
            CHANNEL_UNITS["SS_eng_spd_avg_calc"] = CHANNEL_UNITS["engine_spd"]
            CHANNEL_UNITS["SS_cvt_ratio_avg_calc"] = CHANNEL_UNITS["CVT_ratio_calc"]

        elif run_type == "DownhillRun":
            # Pad the columns to not overlap SS-specific columns.
            # Column names are 1, 2 and 3 spaces so each one is unique.
            for blank_name in (" ", "  ", "   "):
                export_df[blank_name] = np.nan
            for blank_name in (" ", "  ", "   "):
                CHANNEL_UNITS[blank_name] = ""

            # Add some channels from math_df
            export_df["accel_avg_calc_eng_on"] = self.math_df["accel_avg_calc_eng_on"]
            export_df["accel_avg_calc_eng_off"] = self.math_df["accel_avg_calc_eng_off"]
            CHANNEL_UNITS["accel_avg_calc_eng_on"] = CHANNEL_UNITS["gnd_speed"] + "/s"
            CHANNEL_UNITS["accel_avg_calc_eng_off"] = CHANNEL_UNITS["accel_avg_calc_eng_on"]

        # More column-padding, but only needed for runs w/o torque meters.
        if int(self.run_label[:2]) < 6:
            speed_index = export_df.columns.get_loc("gnd_speed")
            export_df.insert(speed_index, "rear_wtq_combined", np.nan)
            CHANNEL_UNITS["rear_wtq_combined"] = CHANNEL_UNITS["wtq_RR"]

        # Replace any NaNs with blanks
        export_df = export_df.fillna("")
        # https://stackoverflow.com/questions/26837998/pandas-replace-nan-with-blank-empty-string

        # Convert time values from hundredths of a second to seconds
        time_series = [round(ti/SAMPLING_FREQ,2)
                                    for ti in export_df.index.tolist()]

        # Convert to list of lists for easier writing out, with the time value
        # prepended to each row.
        # https://stackoverflow.com/questions/28006793/pandas-dataframe-to-list-of-lists
        data_rows = [[t_val] + row
                     for t_val, row in zip(time_series,
                                           export_df.values.tolist())]

        # Format header rows
        channel_list = ["time"] + export_df.columns.tolist()
        unit_list = [CHANNEL_UNITS[c] for c in channel_list]

        # Metadata string first, then headers, then the data.
        sync_array = [[self.get_meta_str()], channel_list, unit_list] + data_rows

        if self.description:
            sync_basename = "%s_Sync-%s.csv" % (self.run_label, self.description)
        else:
            sync_basename = "%s_Sync.csv" % self.run_label

        sync_filename = "%s/%s" % (SYNC_DIR, sync_basename)

        # Check if file exists already. Prompt user for overwrite decision.
        if os.path.exists(sync_filename) and not self.overwrite:
            ow_answer = ""
            while ow_answer.lower() not in ["y", "n"]:
                self.Doc.print("\n%s already exists in sync_data folder. Overwrite? (Y/N)"
                                                            % sync_basename)
                ow_answer = input("> ")
            if ow_answer.lower() == "n":
                return

        # Create new CSV file and write out. Closes automatically at end of
        # with/as block.
        # This block does not run if answered no to overwrite above.
        # newline="" lets the csv module control line endings itself, as the
        # csv documentation requires (avoids doubled line breaks on Windows).
        with open(sync_filename, "w", newline="") as sync_file:
            sync_file_csv = csv.writer(sync_file, dialect="excel")

            self.Doc.print("\nWriting combined data to %s..." % sync_filename)
            sync_file_csv.writerows(sync_array)
            self.Doc.print("...done")

    def log_exception(self, operation):
        """Dump the run's log to a file after an exception and pause.

        Must be called while an exception is being handled so that
        traceback.format_exc() has something to report. The trace is printed
        through the run's output object, the object's full log dump is
        written to a time-stamped text file in LOG_DIR, and the user is asked
        to press Enter before processing moves on.

        operation -- name of the step that failed; used in the file name
                     (lower-cased) and in the prompt.
        """
        trace_text = traceback.format_exc()
        # https://stackoverflow.com/questions/1483429/how-to-print-an-exception-in-python

        stamp = datetime.now().strftime("%Y-%m-%dT%H%M%S")
        # https://stackoverflow.com/questions/415511/how-to-get-the-current-time-in-python
        run_label = self.get_run_label()
        log_name = "%s_Run%s_%s_error.txt" % (stamp, run_label,
                                                            operation.lower())
        self.Doc.print(trace_text)

        # Wait one second to prevent overwriting previous error if it occurred less
        # than one second ago.
        time.sleep(1)

        full_path = os.path.join(LOG_DIR, log_name)
        with open(full_path, "w") as log_file:
            log_file.write(self.get_output().get_log_dump())

        prompt = ("\n%s failed on run %s.\nOutput and exception "
            "trace written to '%s'.\nPress Enter to skip this run."
                                % (operation, run_label, full_path))
        input(prompt)
        print("") # blank line

    def get_run_label(self):
        """Return the run label stored on this object (self.run_label)."""
        return self.run_label

    def get_inca_filename(self):
        """Return the value stored in self.INCA_filename."""
        return self.INCA_filename

    def get_meta_str(self):
        """Return the metadata string without its trailing delimiter.

        Entries are appended to self.meta_str with a trailing " | ". Only
        that exact suffix is removed; a string that is empty or does not end
        with the delimiter is returned unchanged instead of losing its last
        three characters.
        """
        delimiter = " | "
        if self.meta_str.endswith(delimiter):
            # Remove trailing delimiter
            return self.meta_str[:-len(delimiter)]
        return self.meta_str

    def get_output(self):
        """Return the output/log object stored in self.Doc."""
        return self.Doc

    def __str__(self):
        """Use the run label as the string form of the object."""
        return self.run_label

    def __repr__(self):
        """Return a short description of the object that includes the run label."""
        return ("SingleRun object for INCA run %s" % self.run_label)


class SSRun(SingleRun):
    """Represents a single run with steady-state operation. INCA file name
    determines SS vs. Downhill."""

    def abridge_data(self):
        """Isolates important events in data by removing any long stretches of
        no pedal input or pedal events during which the throttle position not
        sustained above threshold for enough time.

        Reads self.sync_df and stores the result in self.abr_df. A pedal-down
        event (pedal_sw == 1) is kept when, at some point during it, the
        throttle channel stays over the angle threshold for longer than the
        time threshold. Kept events closer together than 5 s are merged, a 1 s
        buffer is added on each side, and the pieces are shifted in time and
        concatenated. If no event qualifies (including when sync_df is empty),
        a warning is issued and abr_df is a deep copy of sync_df.

        Also appends a note describing the outcome to self.meta_str.
        """
        # Define constants used to isolating valid events.
        thrtl_thresh = 45 # degrees ("throttle threshold")
        thrtl_t_thresh = 2 # seconds ("throttle time threshold")

        # Need to repair any gaps in INCA samples. If pedal was actuated
        # when sampling cut out, and it was still actuated when the sampling
        # resumed, the abridge_data() algorithm will treat that as a pedal lift
        # when it likely wasn't.
        self.knit_pedal_gaps()

        time_index = self.sync_df.index

        def throttle_window_valid(start_t, end_t):
            """Log the over-threshold duration; return True if long enough."""
            delta = end_t - start_t
            self.Doc.print("\t\tThrottle >%d deg total t:\t%0.2fs" %
                                    (thrtl_thresh, delta / SAMPLING_FREQ))
            # Multiplying by sampling f to get hundredths of a sec.
            return delta > thrtl_t_thresh * SAMPLING_FREQ

        def nearest_position(target, tolerance=None):
            """Return position of the index value nearest to target.

            Stands in for Index.get_loc(target, method="nearest", ...), whose
            method/tolerance arguments were removed in pandas 2.0. Raises
            KeyError, as get_loc did, when nothing lies within tolerance.
            """
            position = time_index.get_indexer([target], method="nearest",
                                              tolerance=tolerance)[0]
            if position == -1:
                raise KeyError(target)
            return position

        # list of start and end times for pedal-down events meeting criteria.
        valid_event_times = []
        # maintain a buffer of candidate pedal-down time vals.
        ped_buffer = []
        # time at which throttle first exceeded threshold in current window.
        throttle_start = 0

        self.Doc.print("\nSteady-state event parsing:")
        pedal_down = False
        counting = False
        keep = False

        samples = zip(time_index, self.sync_df["pedal_sw"],
                                                self.sync_df["throttle"])
        for i, (ti, pedal_sw, throttle) in enumerate(samples):
            # Main loop evaluates pedal-down event. Stores event start and end
            # times if inner checks find criteria met during event.

            if pedal_sw == 1:
                if not pedal_down:
                    self.Doc.print("\tPedal actuated at time\t\t%0.2fs" %
                                                        (ti / SAMPLING_FREQ))
                # pedal currently down
                pedal_down = True
                ped_buffer.append(ti) # add current time to pedal buffer.

                # Calculate throttle over-threshold time to determine event validity
                if not counting and throttle > thrtl_thresh:
                    # first time throttle exceeds threshold
                    self.Doc.print("\t\tThrottle >%d deg at time\t%0.2fs" %
                                        (thrtl_thresh, ti / SAMPLING_FREQ))
                    throttle_start = ti
                    counting = True

                elif counting and throttle < thrtl_thresh:
                    # throttle drops below threshold
                    self.Doc.print("\t\tThrottle <%d deg at time\t%0.2fs" %
                                        (thrtl_thresh, ti / SAMPLING_FREQ))
                    # Window ended at the previous sample. Check if that
                    # over-threshold event lasted long enough.
                    if throttle_window_valid(throttle_start, time_index[i-1]):
                        keep = True
                        # Now the times stored in ped_buffer constitute a valid
                        # event. As long as the pedal switch stays actuated,
                        # subsequent time indices will be added to ped_buffer.
                    counting = False # reset indicator
                    throttle_start = 0 # reset

            elif pedal_down: # pedal just lifted
                # Check if event is valid in case switch goes low before
                # throttle angle drops below its threshold.
                if counting:
                    self.Doc.print("\t(Pedal lifted before throttle dropped "
                                          "below %d deg.)" % thrtl_thresh)
                    # Window ended at the previous (last pedal-down) sample.
                    if throttle_window_valid(throttle_start, time_index[i-1]):
                        keep = True
                    counting = False # reset indicator
                    throttle_start = 0 # reset

                self.Doc.print("\tPedal lifted at time\t\t%0.2fs\n"
                                                        % (ti/SAMPLING_FREQ))
                if keep:
                    valid_event_times.append( [ped_buffer[0], ped_buffer[-1]] )
                pedal_down = False
                ped_buffer = [] # flush buffer
                keep = False # reset
            # else: pedal is not currently down, and wasn't just lifted.

        # One last check in case pedal-down event was ongoing when file ended.
        # Skipped entirely for an empty file, which has no last time value.
        if len(time_index) > 0:
            last_t = time_index[-1]
            if counting:
                self.Doc.print("\t(File ended before throttle dropped "
                                      "below %d deg.)" % thrtl_thresh)
                # The final sample is still part of the over-threshold window,
                # so the window ends at the last time value itself.
                if throttle_window_valid(throttle_start, last_t):
                    keep = True
                counting = False # reset indicator
                throttle_start = 0 # reset
            self.Doc.print("\tFile ended at time\t\t%0.2fs\n"
                                                % (last_t/SAMPLING_FREQ))
        if keep:
            valid_event_times.append( [ped_buffer[0], ped_buffer[-1]] )

        if not valid_event_times:
            # If no times were stored, then alert user but continue with
            # program.
            self.Doc.warn("No valid pedal-down events found in run %s "
                                "(Criteria: throttle >%d deg for >%ds total).\n"
                                "Processing will continue without abridging."
                    % (self.run_label, thrtl_thresh, thrtl_t_thresh))
            self.meta_str += ("No valid pedal-down events found in run. "
                "(Criteria: throttle >%d deg for >%ds total). Data unabridged. | "
                                    % (thrtl_thresh, thrtl_t_thresh))

            self.abr_df = self.sync_df.copy(deep=True)
            return

        # Document in output file
        self.meta_str += ("Isolated events where throttle exceeded "
            "%d deg for >%ds. Removed extraneous surrounding events. | "
                                % (thrtl_thresh, thrtl_t_thresh))

        self.Doc.print("Valid steady-state ranges:")
        for event_time in valid_event_times:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
               % (event_time[0] / SAMPLING_FREQ, event_time[1] / SAMPLING_FREQ))

        # Make sure if two valid events (w/ pedal lift between) are closer
        # than 5s, don't cut into either one. Look at each pair of end/start
        # points, and if they're closer than 5s, merge those two.
        valid_event_times_c = [ valid_event_times[0] ]
        for pair in valid_event_times[1:]:
            earlier_pair = valid_event_times_c[-1]
            if pair[0] - earlier_pair[1] < (5 * SAMPLING_FREQ):
                # Replace the two pairs with a single combined pair
                valid_event_times_c[-1] = [ earlier_pair[0], pair[1] ]
            else:
                valid_event_times_c.append(pair)

        self.Doc.print("After any merges:")
        for event_time in valid_event_times_c:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
                % (event_time[0]/SAMPLING_FREQ, event_time[1] / SAMPLING_FREQ))

        # Add one-second buffer to each side of valid pedal-down events.
        # For more context.
        for n, pair in enumerate(valid_event_times_c):
            if n == 0 and pair[0] <= (1 * SAMPLING_FREQ):
                # Set zero as start value if first time is less than 1s.
                new_start_i = 0
            else:
                new_start_i = nearest_position(
                                pair[0] - 1*SAMPLING_FREQ,
                                tolerance=(1/SAMPLING_FREQ)*SAMPLING_FREQ)

            new_end_i = nearest_position(pair[1] + 1*SAMPLING_FREQ)
            # If file ends less than 1s after event ends, this will return
            # the last time in the file. No tolerance specified for this reason.

            pair[0] = time_index[new_start_i]
            pair[1] = time_index[new_end_i]

        self.Doc.print("INCA times with 1-second buffers added:")
        for event_time in valid_event_times_c:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
               % (event_time[0] / SAMPLING_FREQ, event_time[1] / SAMPLING_FREQ))
        self.Doc.print("") # blank line

        # Split DataFrame into valid pieces; store in list
        valid_events = []
        desired_start_t = 0
        for n, time_range in enumerate(valid_event_times_c):
            # create separate DataFrames for just this event
            valid_event = self.sync_df[time_range[0]:time_range[1]]

            # shift time values to maintain continuity.
            shift = time_range[0] - desired_start_t
            self.Doc.print("Shift (event %d): %.2f" % (n, shift / SAMPLING_FREQ)
                                                                         , True)

            self.shift_time_series(valid_event, offset_val=-shift)

            # Add events to lists
            valid_events.append(valid_event)

            # Define next start time from this event's shifted end time.
            # NOTE(review): this reuses the end time itself rather than the
            # following time value, so consecutive events may share one index
            # value after concatenation - confirm whether that is intended.
            desired_start_t = time_range[1]-shift

        self.Doc.print("Shifted ranges:")
        for event in valid_events:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
              % (event.index[0]/SAMPLING_FREQ, event.index[-1] / SAMPLING_FREQ))

        # Now re-assemble the DataFrame with only valid events.
        # https://pandas.pydata.org/pandas-docs/stable/user_guide/merging.html
        self.abr_df = pd.concat(valid_events)
        self.Doc.print("\nabr_df after abridgement:", True)
        self.Doc.print(self.abr_df.to_string(max_rows=10, max_cols=7,
                                                    show_dimensions=True), True)

        self.Doc.print("\nData time span: %.2f -> %.2f (%d data points)" %
          (self.abr_df.index[0]/SAMPLING_FREQ,
                 self.abr_df.index[-1]/SAMPLING_FREQ, len(self.abr_df.index)))

    def add_math_channels(self):
        """Run calculations on data and store in new dataframe.

        Creates self.math_df with the same index as self.abr_df, then fills
        it by calling add_cvt_ratio() followed by add_ss_avgs().
        """
        self.math_df = pd.DataFrame(index=self.abr_df.index)
        # https://stackoverflow.com/questions/18176933/create-an-empty-data-frame-with-index-from-another-data-frame
        # Order matters: add_ss_avgs() masks the "cvt_ratio_mskd" column that
        # add_cvt_ratio() creates.
        self.add_cvt_ratio()
        self.add_ss_avgs()

    def add_ss_avgs(self):
        """Identify steady-state regions of data and calculate average vals.

        For ground speed and engine speed, adds to self.math_df a centered
        rolling average of the abr_df channel and a centered rolling
        regression slope of that average. A sample counts as steady state
        when both averages are above their minimums and both slopes are
        within +/- their limits. The boolean result is stored in
        "steady_state"; masked copies of the averages, slopes and the
        existing "cvt_ratio_mskd" column get NaN wherever the criteria fail.
        The overall mean of each masked channel is stored at index 0 of the
        "SS_gnd_spd_avg", "SS_eng_spd_avg" and "SS_cvt_ratio_avg" columns
        (NaN elsewhere).

        Requires "cvt_ratio_mskd" to already exist in math_df. Also appends
        the criteria and window sizes to self.meta_str.
        """
        win_size_avg = 51  # window size for speed rolling avg.
        win_size_slope = 301 # win size for rolling slope of speed rolling avg.

        gspd_cr = 2.5     # mph. Ground speed (min) criterion for determining if
                          # steady-state event is moving rather than stationary.
        gs_slope_cr = 0.25  # mph/s.
        # Ground-speed slope (max) criterion to est. steady-state. Abs value

        espd_cr = 2750    # rpm. Engine speed (min) criterion for determining if
                          # steady-state event is moving rather than stationary.
        es_slope_cr = 100  # rpm/s.
        # Engine-speed slope (max) criterion to est. steady-state. Abs value

        # Document in metadata string for output file:
        self.meta_str += ("Steady-state calc criteria: "
                          "gnd speed above %s mph, "
                          "gnd speed slope magnitude less than %s mph/s, "
                          "eng speed above %s rpm, "
                          "eng speed slope magnitude less than %s rpm/s | "
                            % (gspd_cr, gs_slope_cr, espd_cr, es_slope_cr))
        self.meta_str += ("Steady-state calc rolling window sizes: "
                                                "%d for avg, %d for slope | "
                                            % (win_size_avg, win_size_slope))

        def add_rolling_channels(src_col, avg_col, slope_col, progress_msg):
            """Add rolling avg of abr_df[src_col] and its rolling slope."""
            self.math_df[avg_col] = self.abr_df.rolling(
                           window=win_size_avg, center=True)[src_col].mean()
            # https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.rolling.html

            # Create and register a new tqdm instance with pandas.
            # Have to manually feed it the total iteration count.
            tqdm.pandas(total=len(self.abr_df.index)
                                    -(win_size_avg-1)-(win_size_slope-1))
            # https://stackoverflow.com/questions/48935907/tqdm-not-showing-bar
            self.Doc.print(progress_msg)
            # Slope of a first-order fit of each window against time in
            # seconds (index / SAMPLING_FREQ).
            self.math_df[slope_col] = self.math_df[avg_col].rolling(
                    window=win_size_slope, center=True).progress_apply(
                        lambda x: np.polyfit(x.index/SAMPLING_FREQ, x, 1)[0])
            # https://stackoverflow.com/questions/18603270/progress-indicator-during-pandas-operations
            self.Doc.print("...done")

        # Create rolling average and rolling (regression) slope of rolling avg
        # for ground speed.
        add_rolling_channels("gnd_speed", "gs_rolling_avg", "gs_rolling_slope",
                "\nCalculating rolling regression on ground speed data...")

        # Create rolling average and rolling (regression) slope of rolling avg
        # for engine speed.
        add_rolling_channels("engine_spd", "es_rolling_avg", "es_rolling_slope",
                "Calculating rolling regression on engine speed data...")

        # Apply speed and speed slope criteria to isolate steady-state events.
        ss_filter = (      (self.math_df["gs_rolling_avg"] > gspd_cr)
                         & (self.math_df["gs_rolling_slope"] < gs_slope_cr)
                         & (self.math_df["gs_rolling_slope"] > -gs_slope_cr)
                         & (self.math_df["es_rolling_avg"] > espd_cr)
                         & (self.math_df["es_rolling_slope"] < es_slope_cr)
                         & (self.math_df["es_rolling_slope"] > -es_slope_cr) )
        # gs_slope_cr and es_slope_cr are abs value so have to apply on high
        # and low end.
        self.Doc.print("\nTotal data points that fail steady-state criteria: %d"
                                                % (~ss_filter).sum(), True)
        self.Doc.print("Total data points that meet steady-state criteria: %d"
                                                % ss_filter.sum(), True)

        self.math_df["steady_state"] = ss_filter

        # "Mask off" by assigning NaN where criteria not met.
        # The slopes are masked too to calculate avg slope off SS region later.
        # https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#indexing-where-mask
        for masked_col, source_col in (
                ("gs_rol_avg_mskd", "gs_rolling_avg"),
                ("es_rol_avg_mskd", "es_rolling_avg"),
                ("gs_rslope_mskd", "gs_rolling_slope"),
                ("es_rslope_mskd", "es_rolling_slope")):
            self.math_df[masked_col] = self.math_df[source_col].mask(~ss_filter)

        # No need to run rolling avg or slope on cvt_ratio since we aren't
        # applying criteria to it for purpose of determining steady state.
        # Assigned back explicitly: an in-place mask on the selected column is
        # a chained operation that may act on a temporary copy and leave the
        # DataFrame unchanged.
        self.math_df["cvt_ratio_mskd"] = self.math_df["cvt_ratio_mskd"].mask(
                                                                    ~ss_filter)

        # Calculate overall (aggregate) mean of each filtered/masked channel.
        # Prefill with NaN and assign mean to first element.
        for avg_col, masked_col in (
                ("SS_gnd_spd_avg", "gs_rol_avg_mskd"),
                ("SS_eng_spd_avg", "es_rol_avg_mskd"),
                ("SS_cvt_ratio_avg", "cvt_ratio_mskd")):
            self.math_df[avg_col] = np.nan
            self.math_df.at[0, avg_col] = self.math_df[masked_col].mean()
        # https://stackoverflow.com/questions/13842088/set-value-for-particular-cell-in-pandas-dataframe-using-index
        # https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.at.html

        # pandas rolling(), apply(), regression references:
        # https://stackoverflow.com/questions/47390467/pandas-dataframe-rolling-with-two-columns-and-two-rows
        # https://pandas.pydata.org/pandas-docs/version/0.23.4/whatsnew.html#rolling-expanding-apply-accepts-raw-false-to-pass-a-series-to-the-function
        # https://stackoverflow.com/questions/49100471/how-to-get-slopes-of-data-in-pandas-dataframe-in-python
        # https://www.pythonprogramming.net/rolling-apply-mapping-functions-data-analysis-python-pandas-tutorial/
        # https://stackoverflow.com/questions/21025821/python-custom-function-using-rolling-apply-for-pandas
        # http://greg-ashton.physics.monash.edu/applying-python-functions-in-moving-windows.html
        # https://stackoverflow.com/questions/50482884/module-pandas-has-no-attribute-rolling-mean
        # https://stackoverflow.com/questions/45254174/how-do-pandas-rolling-objects-work
        # https://pandas.pydata.org/pandas-docs/stable/user_guide/computation.html
        # https://becominghuman.ai/linear-regression-in-python-with-pandas-scikit-learn-72574a2ec1a5
        # https://medium.com/the-code-monster/split-a-dataset-into-train-and-test-datasets-using-sk-learn-acc7fd1802e0
        # https://towardsdatascience.com/regression-plots-with-pandas-and-numpy-faf2edbfad4f
        # https://data36.com/linear-regression-in-python-numpy-polyfit/

    def plot_data(self, overwrite=False, description=""):
        """Produce the parent class's plots, then the steady-state plot.

        Both arguments are forwarded, unchanged and positionally, to the
        parent class's plot_data().
        """
        # Everything common to all run types lives in the parent method.
        super().plot_data(overwrite, description)
        # Steady-state-specific figure.
        self.plot_ss_range()

    def plot_abridge_compare(self):
        """Plot throttle and pedal switch before and after abridging.

        Top subplot: "throttle" and "pedal_sw" from raw_inca_df plotted against
        its index as-is. Bottom subplot: the same two channels from abr_df,
        plotted against the abr_df index divided by SAMPLING_FREQ. The figure
        is exported with the "abr" tag and then cleared.
        """
        throttle_color = "tab:purple"
        pedal_color = "tab:red"

        def format_throttle_axis(axis):
            # Lower limit below zero shifts the throttle trace up so it does
            # not sit on top of the pedal-switch trace.
            axis.set_ylim([-25, 100])
            axis.set_yticks([0, 20, 40, 60, 80, 100])
            axis.set_ylabel("Throttle (deg)", color=throttle_color)
            axis.tick_params(axis="y", labelcolor=throttle_color)

        def format_pedal_axis(axis):
            # Upper limit well above 1 squashes the 0/1 pedal-switch trace
            # into the bottom of the subplot.
            axis.set_ylim([-.25, 8])
            axis.set_yticks([0, 1])
            axis.set_ylabel("Pedal Switch", color=pedal_color)
            axis.tick_params(axis="y", labelcolor=pedal_color)

        # ---- Top: original (raw INCA) data ----
        # https://matplotlib.org/3.2.1/api/_as_gen/matplotlib.pyplot.subplot.html
        raw_ax = plt.subplot(211)
        raw_ax.plot(self.raw_inca_df.index, self.raw_inca_df["throttle"],
                    label="Throttle (og)", color=throttle_color)
        raw_ax.set_title("Run %s - Abridge Compare" % self.run_label,
                         loc="left")
        format_throttle_axis(raw_ax)

        # Second y axis sharing the same x axis.
        # https://matplotlib.org/gallery/api/two_scales.html
        raw_pedal_ax = raw_ax.twinx()
        raw_pedal_ax.plot(self.raw_inca_df.index, self.raw_inca_df["pedal_sw"],
                          label="Pedal Switch (og)", color=pedal_color)
        format_pedal_axis(raw_pedal_ax)

        # x tick labels only on the bottom subplot.
        plt.setp(raw_ax.get_xticklabels(), visible=False)

        # ---- Bottom: abridged data, sharing both axes with the top plot ----
        # https://matplotlib.org/3.2.1/gallery/subplots_axes_and_figures/shared_axis_demo.html#sphx-glr-gallery-subplots-axes-and-figures-shared-axis-demo-py
        abr_ax = plt.subplot(212, sharex=raw_ax, sharey=raw_ax)
        # Convert DataFrame index values to seconds.
        abr_seconds = [round(idx/SAMPLING_FREQ, 2)
                       for idx in self.abr_df.index]
        abr_ax.plot(abr_seconds, self.abr_df["throttle"],
                    color=throttle_color, label="Throttle (synced)")
        abr_ax.set_xlabel("Time (s)")
        format_throttle_axis(abr_ax)

        abr_pedal_ax = abr_ax.twinx()
        abr_pedal_ax.plot(abr_seconds, self.abr_df["pedal_sw"],
                          label="Pedal Switch (synced)", color=pedal_color)
        format_pedal_axis(abr_pedal_ax)

        # plt.show() can't be used w/ WSL, so export to file instead.
        # https://stackoverflow.com/questions/43397162/show-matplotlib-plots-and-other-gui-in-ubuntu-wsl1-wsl2
        self.export_plot("abr")
        # Clear the figure so the next plot starts clean.
        # https://stackoverflow.com/questions/8213522/when-to-use-cla-clf-or-close-for-clearing-a-plot-in-matplotlib
        plt.clf()

    def plot_ss_range(self):
        """Plot the abridged data with the steady-state regions highlighted.

        Three stacked subplots share one x axis (abr_df index divided by
        SAMPLING_FREQ): ground speed, engine speed (each with its rolling
        average and the masked steady-state portion), and throttle with the
        pedal switch on a twin y axis. The figure is exported with the "ss"
        tag and then cleared.
        """
        speed_ax = plt.subplot(311)
        # Same time axis for every trace: DataFrame index converted to seconds.
        seconds = self.abr_df.index/SAMPLING_FREQ

        ground_speed_traces = (
            (self.abr_df["gnd_speed"], "Ground Speed", "k"),
            (self.math_df["gs_rolling_avg"], "Rolling Avg", "c"),
            (self.math_df["gs_rol_avg_mskd"], "Steady-state", "r"),
        )
        for series, trace_label, trace_color in ground_speed_traces:
            speed_ax.plot(seconds, series, label=trace_label,
                          color=trace_color)
        speed_ax.set_title("Run %s - Steady-state Isolation (Abridged Data)"
                           % self.run_label, loc="left")
        speed_ax.set_ylabel("Speed (mph)")
        plt.setp(speed_ax.get_xticklabels(), visible=False)

        engine_ax = plt.subplot(312, sharex=speed_ax)
        engine_speed_traces = (
            (self.abr_df["engine_spd"], "Engine Speed", "yellowgreen"),
            (self.math_df["es_rolling_avg"], "Rolling Avg", "tab:orange"),
            (self.math_df["es_rol_avg_mskd"], "Steady-state", "tab:blue"),
        )
        for series, trace_label, trace_color in engine_speed_traces:
            engine_ax.plot(seconds, series, label=trace_label,
                           color=trace_color)
        engine_ax.set_ylabel("Engine Speed (rpm)")
        plt.setp(engine_ax.get_xticklabels(), visible=False)

        throttle_ax = plt.subplot(313, sharex=speed_ax)
        throttle_color = "tab:purple"
        throttle_ax.plot(seconds, self.abr_df["throttle"],
                         label="Throttle", color=throttle_color)
        throttle_ax.set_ylim([-25, 100]) # Shift throttle trace up
        throttle_ax.set_yticks([0, 20, 40, 60, 80, 100])
        throttle_ax.set_xlabel("Time (s)")
        throttle_ax.set_ylabel("Throttle (deg)", color=throttle_color)
        throttle_ax.tick_params(axis="y", labelcolor=throttle_color)

        # Pedal switch goes on a second y axis over the throttle subplot.
        # https://matplotlib.org/gallery/api/two_scales.html
        pedal_ax = throttle_ax.twinx()
        pedal_color = "tab:red"
        pedal_ax.plot(seconds, self.abr_df["pedal_sw"], color=pedal_color)
        pedal_ax.set_ylim([-.25, 8]) # scale down pedal switch
        pedal_ax.set_yticks([0, 1])
        pedal_ax.set_ylabel("Pedal Switch", color=pedal_color)
        pedal_ax.tick_params(axis="y", labelcolor=pedal_color)

        # plt.show() can't be used w/ WSL, so export to file instead.
        # https://stackoverflow.com/questions/43397162/show-matplotlib-plots-and-other-gui-in-ubuntu-wsl1-wsl2
        self.export_plot("ss")
        # https://stackoverflow.com/questions/8213522/when-to-use-cla-clf-or-close-for-clearing-a-plot-in-matplotlib
        plt.clf()

    def get_run_type(self):
        """Return the string identifying this run type ("SSRun")."""
        run_type = "SSRun"
        return run_type


class DownhillRun(SingleRun):
    """Represents a single run with downhill engine-braking operation."""

    def abridge_data(self):
        """Isolate downhill, pedal-up events and store them in self.abr_df.

        Steps:
          1. Repair pedal-channel gaps via knit_pedal_gaps().
          2. Compute a centered rolling average of ground speed and a
             centered rolling linear-regression slope of that average.
          3. Flag samples where (pedal_sw is NaN or throttle < throttle_cr)
             and rolling-avg speed > gspd_cr and rolling slope > gs_slope_cr.
          4. Group flagged samples into continuous ranges and discard ranges
             that do not last longer than gs_slope_t_cr seconds.
          5. Fit one regression line per surviving range, widen each range to
             the nearest samples with rolling-avg speed < 1 mph, merge ranges
             that end up closer than 5 s, shift the pieces so they are
             contiguous in time, and concatenate them into self.abr_df.

        Side effects: sync_df gains the columns "gs_rolling_avg",
        "gs_rolling_slope", "downhill_filter", "trendlines" and "slopes";
        meta_str is extended with a description of what was done. If no event
        survives the criteria, abr_df is an unabridged deep copy of sync_df
        and the method returns early.
        """
        # Need to repair any gaps in INCA samples. If pedal was actuated
        # when sampling cut out, and it was still actuated when the sampling
        # resumed, the abridge_data() algorithm will treat that as a pedal lift
        # when it likely wasn't.
        self.knit_pedal_gaps()

        # Apply rolling avg filter to smooth data.
        win_size_avg = 101  # window size for speed rolling avg.
        win_size_slope = 301 # win size for rolling slope of speed rolling avg.
        gspd_cr = 2.5     # mph. Ground speed (min) criterion for discerning
                          # valid downhill event.
        gs_slope_cr = +1.0  # mph/s.
        # Ground-speed slope min criterion to identify increasing speed downhill.
        gs_slope_t_cr = 3.0 # seconds. Continuous amount of time the slope
                            # criterion must be met to keep event.
        throttle_cr = 5.0 # deg. Anything below this interpreted as closed throt.

        # Create rolling average of ground speed (unabridged data).
        gs_rolling_avg = self.sync_df.rolling(
                           window=win_size_avg, center=True)["gnd_speed"].mean()

        tqdm.pandas(total=len(self.sync_df.index)-(win_size_avg-1)-(win_size_slope-1))
        # https://stackoverflow.com/questions/48935907/tqdm-not-showing-bar
        self.Doc.print("\nCalculating rolling regression on ground speed data...")
        gs_rolling_slope = gs_rolling_avg.rolling(
                            window=win_size_slope, center=True).progress_apply(
                        lambda x: np.polyfit(x.index/SAMPLING_FREQ, x, 1)[0])
        self.Doc.print("...done")

        # Apply pedal, throttle, speed, and speed slope criteria to isolate
        # downhill, pedal-up events.
        downhill_filter = (  (  (self.sync_df["pedal_sw"].isna())
                                 | (self.sync_df["throttle"] < throttle_cr)  )
                              & (gs_rolling_avg > gspd_cr)
                              & (gs_rolling_slope > gs_slope_cr)     )
        # NaNs in pedal channel treated as pedal up.

        def keep_unabridged():
            """Attach the helper channels to sync_df and copy it to abr_df."""
            self.sync_df["gs_rolling_avg"] = gs_rolling_avg
            self.sync_df["gs_rolling_slope"] = gs_rolling_slope
            self.sync_df["downhill_filter"] = downhill_filter
            self.sync_df["trendlines"] = np.nan
            self.sync_df["slopes"] = np.nan
            self.abr_df = self.sync_df.copy(deep=True)

        # Rolling-average samples that satisfy every criterion. Only the index
        # (the sample labels) is used below.
        valid_times = gs_rolling_avg.mask(~downhill_filter).dropna()

        # NOTE: the criteria are floats (e.g. 2.5 mph); they are formatted with
        # %g because %d would silently truncate them in the messages below.
        if valid_times.empty:
            # If no times were stored, then alert user but continue with
            # program.
            self.Doc.warn("No valid downhill events found in run %s (Criteria: "
                "speed slope >%g mph/s, speed >%g mph, and throttle <%g deg).\n"
                                   "Processing will continue without abridging."
                        % (self.run_label, gs_slope_cr, gspd_cr, throttle_cr))
            # Take care of needed assignments that are typically down below.
            keep_unabridged()

            self.meta_str += ("No valid downhill events found in run (Criteria: "
            "speed slope >%g mph/s, speed >%g mph, and throttle <%g deg). "
            "Data unabridged. | " % (gs_slope_cr, gspd_cr, throttle_cr))
            return

        # Identify separate continuous ranges (runs of consecutive labels).
        # Tracking the previous label explicitly keeps this correct when only
        # a single sample is valid (the loop body then never runs).
        cont_ranges = [] # [first_label, last_label] pairs w/ no gaps inside
        range_start = prev_label = valid_times.index[0]
        for label in valid_times.index[1:]:
            if label - prev_label > 1:
                # Gap found: close the current range and start a new one.
                cont_ranges.append([range_start, prev_label])
                range_start = label
            prev_label = label
        # Close the last range.
        cont_ranges.append([range_start, prev_label])

        self.Doc.print("\nDownhill ranges (before imposing length req.):", True)
        for event_range in cont_ranges:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
               % (event_range[0] / SAMPLING_FREQ, event_range[1] / SAMPLING_FREQ), True)

        min_event_len = gs_slope_t_cr*SAMPLING_FREQ
        valid_slopes = []
        for event_range in cont_ranges:
            if event_range[1]-event_range[0] > min_event_len:
                # Must have > gs_slope_t_cr seconds to count.
                valid_slopes.append(event_range)
            else:
                # Adjust filter to eliminate these extraneous events. The
                # bounds are index labels, so use label-based .loc, which is
                # end-inclusive and therefore also clears the final sample.
                downhill_filter.loc[event_range[0]:event_range[1]] = False

        if not valid_slopes:
            # If no times were stored, then alert user but continue with
            # program.
            self.Doc.print("\nNo valid downhill events found in run %s "
            "(Criteria: speed slope >%g mph/s, speed >%g mph, and throttle <%g "
                "deg for >%gs).\nProcessing will continue without abridging."
            % (self.run_label, gs_slope_cr, gspd_cr, throttle_cr, gs_slope_t_cr))
            self.meta_str += ("No valid downhill events found in run (Criteria: "
            "speed slope >%g mph/s, speed >%g mph, and throttle <%g deg for "
            ">%gs). Data unabridged. | "
                          % (gs_slope_cr, gspd_cr, throttle_cr, gs_slope_t_cr))

            keep_unabridged()
            return

        # Document in output file
        self.meta_str += ("Isolated events where speed slope exceeded %g "
        "mph/s with speed >%g mph and throttle <%g deg for >%gs. "
        "Removed extraneous surrounding events. "
        "These same criteria were used for the downhill calcs. | "
            % (gs_slope_cr, gspd_cr, throttle_cr, gs_slope_t_cr))

        # Document window sizes in metadata string for output file:
        self.meta_str += ("Isolation and downhill calc rolling window sizes: "
                                                "%d for avg, %d for slope | "
                                            % (win_size_avg, win_size_slope))

        # Add buffers on each side - find closest point where the rolling-avg
        # ground speed is <1 mph. (No additional margin is added beyond that
        # point.)
        slow_index = gs_rolling_avg[gs_rolling_avg < 1].index

        def nearest_slow(label, method, fallback):
            """Return the closest slow-sample label in the given fill
            direction ("ffill" = at/before, "bfill" = at/after), or fallback
            when no such sample exists."""
            if slow_index.empty:
                return fallback
            # Index.get_loc(..., method=...) was removed in pandas 2.0;
            # get_indexer is the supported equivalent and signals "no match"
            # with -1 instead of raising KeyError.
            pos = slow_index.get_indexer([label], method=method)[0]
            return fallback if pos == -1 else slow_index[pos]

        # Now loop through event ranges and find "slow" times on either side
        # of range to expand and give context to the event.
        valid_ranges = copy.deepcopy(valid_slopes)
        # When copying list of lists, the contained lists are aliased w/
        # typical list-copy methods like [:] or .copy().
        # https://stackoverflow.com/questions/2612802/list-changes-unexpectedly-after-assignment-how-do-i-clone-or-copy-it-to-prevent
        last_pos = len(self.sync_df.index)-1
        for event_range in valid_ranges:
            # Bias down for first range val, up for second range val.
            new_start_i = nearest_slow(event_range[0], "ffill", 0)
            new_end_i = nearest_slow(event_range[1], "bfill", last_pos)

            # NOTE(review): the labels found above are used as positions into
            # sync_df.index, which presumes labels and positions coincide
            # (index 0..N-1) - confirm against how sync_df is built.
            event_range[0] = self.sync_df.index[new_start_i]
            event_range[1] = self.sync_df.index[new_end_i]

        # Create overall regression curve (not rolling) for each valid range.
        # Store for later plotting.
        trendlines = pd.Series(np.nan, index=self.sync_df.index)
        slopes = pd.Series(np.nan, index=self.sync_df.index)
        self.Doc.print("\nValid downhill ranges:")
        for n, event_range in enumerate(valid_slopes):
            # Input each event range's gs_rolling_avg values into np.polyfit
            # Put them in new column. Everywhere else is NaN.
            coeff = np.polyfit(self.sync_df.index[event_range[0]:event_range[1]]/SAMPLING_FREQ,
                               gs_rolling_avg[event_range[0]:event_range[1]], 1)
            poly_fxn = np.poly1d(coeff)
            # https://stackoverflow.com/questions/26447191/how-to-add-trendline-in-python-matplotlib-dot-scatter-graphs

            # Use broader range for trendline plotting so each appears extended
            # in plot used later.
            wide_start, wide_end = valid_ranges[n]
            trendlines[wide_start:wide_end-1] = poly_fxn(
                self.sync_df.index[wide_start:wide_end-1]/SAMPLING_FREQ)
            # Subtracting one to end index to maintain a NaN between slopes,
            # else plot would draw vertical line joining them.

            # Store slope value itself for later retrieval, this time in the
            # precise window. Same slope val stored at each index in continuous
            # range.
            slopes[event_range[0]:event_range[1]] = coeff[0]

            self.Doc.print("\t%0.2f\t->\t%0.2f\t|    Slope: %+0.2f mph/s"
              % (event_range[0] / SAMPLING_FREQ, event_range[1] / SAMPLING_FREQ,
                  coeff[0]))

        self.Doc.print("After widening range to capture complete event(s):")
        for event_time in valid_ranges:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
                % (event_time[0]/SAMPLING_FREQ, event_time[1] / SAMPLING_FREQ))

        # Make sure if two valid events are closer than 5s, don't cut into
        # either one. Look at each pair of end/start points, and if they're
        # closer than 5s, merge those two.
        # This also handles cases where two or more ranges end up being
        # identical after widening window to closest low-speed areas.
        valid_ranges_c = [ valid_ranges[0] ]
        for pair in valid_ranges[1:]:
            earlier_pair = valid_ranges_c[-1]
            if pair[0] - earlier_pair[1] < (5 * SAMPLING_FREQ):
                # Replace the two pairs with a single combined pair
                valid_ranges_c[-1] = [ earlier_pair[0], pair[1] ]
            else:
                valid_ranges_c.append(pair)

        self.Doc.print("After any merges:")
        for event_time in valid_ranges_c:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
                % (event_time[0]/SAMPLING_FREQ, event_time[1] / SAMPLING_FREQ))
        self.Doc.print("") # blank line

        # Split DataFrame into valid pieces; store in list
        valid_events = []
        # Cut up and re-join rolling avg channels too for later use.
        # Piggyback on sync_df for now.
        self.sync_df["gs_rolling_avg"] = gs_rolling_avg
        self.sync_df["gs_rolling_slope"] = gs_rolling_slope
        self.sync_df["downhill_filter"] = downhill_filter
        self.sync_df["trendlines"] = trendlines
        self.sync_df["slopes"] = slopes
        desired_start_t = 0
        for n, time_range in enumerate(valid_ranges_c):
            # create separate DataFrame for each event
            valid_event = self.sync_df[time_range[0]:time_range[1]]

            # shift time values to maintain continuity.
            shift = time_range[0] - desired_start_t
            self.Doc.print("Shift (event %d): %.2f" % (n, shift / SAMPLING_FREQ)
                                                                         , True)

            self.shift_time_series(valid_event, offset_val=-shift)

            # Add event to list
            valid_events.append(valid_event)

            # define next start time to be next time value after new vector's
            # end time.
            desired_start_t = time_range[1]-shift

        self.Doc.print("Shifted ranges:")
        for event in valid_events:
            self.Doc.print("\t%0.2f\t->\t%0.2f"
              % (event.index[0]/SAMPLING_FREQ, event.index[-1] / SAMPLING_FREQ))

        # Now re-assemble the DataFrame with only valid events.
        # Carries over rolling and filter channels added to sync_df above.
        self.abr_df = pd.concat(valid_events)
        # https://pandas.pydata.org/pandas-docs/stable/user_guide/merging.html

        self.Doc.print("\nabr_df after abridgement:", True)
        self.Doc.print(self.abr_df.to_string(max_rows=10, max_cols=7,
                                                    show_dimensions=True), True)

        self.Doc.print("\nData time span: %.2f -> %.2f (%d data points)" %
          (self.abr_df.index[0]/SAMPLING_FREQ,
                 self.abr_df.index[-1]/SAMPLING_FREQ, len(self.abr_df.index)))

    def add_math_channels(self):
        """Build math_df from the channels computed while abridging.

        math_df is created with the same index as abr_df. The five helper
        channels added during abridge_data() are copied into it; all but
        "slopes" are then removed from abr_df. "slopes" stays in abr_df under
        the name "gnd_speed_reg_slope" (with a matching CHANNEL_UNITS entry)
        so it is exported. Finally the CVT-ratio and downhill-average
        channels are added.
        """
        # https://stackoverflow.com/questions/18176933/create-an-empty-data-frame-with-index-from-another-data-frame
        self.math_df = pd.DataFrame(index=self.abr_df.index)

        # Channels calculated during abridge, in the order they should appear
        # in math_df. "slopes" is deliberately last; see below.
        abridge_channels = ("gs_rolling_avg", "gs_rolling_slope",
                            "downhill_filter", "trendlines", "slopes")
        for channel in abridge_channels:
            self.math_df[channel] = self.abr_df[channel]

        # Everything except "slopes" is dropped from the abridged data.
        for channel in abridge_channels[:-1]:
            del self.abr_df[channel]

        # Keep the slopes channel for later export, under a clearer name.
        # https://datatofish.com/rename-columns-pandas-dataframe/
        self.abr_df.rename(columns={"slopes": "gnd_speed_reg_slope"}, inplace=True)
        CHANNEL_UNITS["gnd_speed_reg_slope"] = CHANNEL_UNITS["gnd_speed"] + "/s"

        self.add_cvt_ratio()
        self.add_downhill_avgs()

    def add_downhill_avgs(self):
        """Add masked downhill channels and aggregate accel values to math_df.

        Reads math_df["downhill_filter"], ["gs_rolling_avg"],
        ["gs_rolling_slope"], ["cvt_ratio_mskd"] and ["slopes"], plus
        abr_df["engine_spd"]. Adds to math_df:
          - gs_rol_avg_mskd / gs_rol_slope_mskd: rolling channels with NaN
            wherever the downhill filter is False.
          - cvt_ratio_mskd: re-masked with the same filter.
          - gs_rol_avg_mskd_eng_on / _eng_off: the masked rolling average
            split by whether engine_spd is > 0 or == 0.
          - accel_avg_calc_eng_on / _eng_off: mean of "slopes" for each
            engine state, stored at row label 0 (NaN elsewhere).
        Point counts and the two accel values are printed via self.Doc.
        """
        downhill = self.math_df["downhill_filter"]
        not_downhill = ~downhill

        self.math_df["gs_rol_avg_mskd"] = self.math_df["gs_rolling_avg"].mask(
                                                                not_downhill)
        self.math_df["gs_rol_slope_mskd"] = self.math_df["gs_rolling_slope"].mask(
                                                                not_downhill)
        # Assign the masked result back explicitly. Calling
        # df["col"].mask(..., inplace=True) operates on a temporary Series and
        # does not update the DataFrame under pandas Copy-on-Write.
        self.math_df["cvt_ratio_mskd"] = self.math_df["cvt_ratio_mskd"].mask(
                                                                not_downhill)
            # CVT values of 0 or above 5 already masked.

        self.Doc.print("\nTotal data points that fail downhill criteria: %d"
                                                % not_downhill.sum(), True)
        self.Doc.print("Total data points that meet downhill criteria: %d"
                                                    % downhill.sum(), True)

        # Create separate channels for engine-on and engine-off segments.
        # NOTE(review): a NaN engine_spd is neither > 0 nor == 0, so such
        # samples are left unmasked in both channels - confirm intended.
        engine_on = (self.abr_df["engine_spd"] > 0)
        engine_off = (self.abr_df["engine_spd"] == 0)

        self.math_df["gs_rol_avg_mskd_eng_on"] = self.math_df["gs_rol_avg_mskd"].mask(
                                                                    engine_off)
        self.math_df["gs_rol_avg_mskd_eng_off"] = self.math_df["gs_rol_avg_mskd"].mask(
                                                                    engine_on)

        self.Doc.print("\nTotal engine-on downhill data points: %d"
                        % self.math_df["gs_rol_avg_mskd_eng_on"].count(), True)
        self.Doc.print("Total engine-off downhill data points: %d"
                        % self.math_df["gs_rol_avg_mskd_eng_off"].count(), True)

        # Calculate aggregate slope (accel is positive / decel is negative).
        # Prefill each column with NaN and store the mean at row label 0.
        self.math_df["accel_avg_calc_eng_on"] = np.nan
        self.math_df.at[0, "accel_avg_calc_eng_on"] = np.mean(
                                        self.math_df["slopes"].mask(engine_off))

        self.math_df["accel_avg_calc_eng_off"] = np.nan
        self.math_df.at[0, "accel_avg_calc_eng_off"] = np.mean(
                                        self.math_df["slopes"].mask(engine_on))

        self.Doc.print("\nEngine-on downhill accel: %.2f"
                                % self.math_df.at[0, "accel_avg_calc_eng_on"])
        self.Doc.print("Engine-off downhill accel: %.2f"
                                % self.math_df.at[0, "accel_avg_calc_eng_off"])

    def plot_data(self, overwrite=False, description=""):
        """Produce the parent class's plots, then the downhill plot.

        Both arguments are forwarded, unchanged and positionally, to the
        parent class's plot_data().
        """
        # Everything common to all run types lives in the parent method.
        super().plot_data(overwrite, description)
        # Downhill-specific figure.
        self.plot_downhill_range()

    def plot_abridge_compare(self):
        """Plot ground speed before (top) and after (bottom) abridging.

        Each subplot shows raw ground speed, its rolling average, and the
        rolling average restricted to the downhill-filtered samples. The top
        subplot reads sync_df; the bottom reads abr_df and math_df. The figure
        is exported with the "abr" tag and then cleared.
        """
        raw_color, avg_color, event_color = "k", "c", "r"

        # ---- Top: unabridged data ----
        # https://matplotlib.org/3.2.1/api/_as_gen/matplotlib.pyplot.subplot.html
        full_ax = plt.subplot(211)
        sync_seconds = self.sync_df.index/SAMPLING_FREQ
        sync_avg = self.sync_df["gs_rolling_avg"]
        full_ax.plot(sync_seconds, self.sync_df["gnd_speed"], color=raw_color)
        full_ax.plot(sync_seconds, sync_avg, color=avg_color)
        full_ax.plot(sync_seconds,
                     sync_avg.mask(~self.sync_df["downhill_filter"]),
                     color=event_color)

        full_ax.set_title("Run %s - Abridge Compare" % self.run_label,
                          loc="left")
        full_ax.set_ylabel("Speed (mph)")

        # x tick labels only on the bottom subplot.
        plt.setp(full_ax.get_xticklabels(), visible=False)

        # ---- Bottom: abridged data on a shared x axis ----
        abr_ax = plt.subplot(212, sharex=full_ax)
        math_seconds = self.math_df.index/SAMPLING_FREQ
        abr_ax.plot(self.abr_df.index/SAMPLING_FREQ, self.abr_df["gnd_speed"],
                    color=raw_color)
        abr_ax.plot(math_seconds, self.math_df["gs_rolling_avg"],
                    color=avg_color)
        abr_ax.plot(math_seconds, self.math_df["gs_rol_avg_mskd"],
                    color=event_color)

        abr_ax.set_ylabel("Speed (mph)")
        abr_ax.set_xlabel("Time (s)")

        # plt.show() can't be used w/ WSL, so export to file instead.
        # https://stackoverflow.com/questions/43397162/show-matplotlib-plots-and-other-gui-in-ubuntu-wsl1-wsl2
        self.export_plot("abr")
        # https://stackoverflow.com/questions/8213522/when-to-use-cla-clf-or-close-for-clearing-a-plot-in-matplotlib
        plt.clf()

    def plot_downhill_range(self):
        """Plot the unabridged data with the downhill regions highlighted.

        Three stacked subplots share one x axis (sync_df index divided by
        SAMPLING_FREQ): ground speed with its rolling average and the
        downhill-filtered portion, engine speed, and throttle with the pedal
        switch on a twin y axis. The figure is exported with the "downhill"
        tag and then cleared.
        """
        seconds = self.sync_df.index/SAMPLING_FREQ

        # ---- Ground speed ----
        # Named colors: https://matplotlib.org/3.1.0/gallery/color/named_colors.html
        speed_ax = plt.subplot(311)
        rolling_avg = self.sync_df["gs_rolling_avg"]
        speed_traces = (
            (self.sync_df["gnd_speed"], "k"),
            (rolling_avg, "c"),
            (rolling_avg.mask(~self.sync_df["downhill_filter"]), "r"),
        )
        for series, trace_color in speed_traces:
            speed_ax.plot(seconds, series, color=trace_color)
        speed_ax.set_ylabel("Speed (mph)")
        plt.setp(speed_ax.get_xticklabels(), visible=False) # x labels only on bottom
        speed_ax.set_title("Run %s - Downhill Isolation (Unabridged Data)"
                           % self.run_label, loc="left")

        # ---- Engine speed ----
        engine_ax = plt.subplot(312, sharex=speed_ax)
        engine_ax.plot(seconds, self.sync_df["engine_spd"])
        engine_ax.set_ylabel("Engine Speed (rpm)")
        plt.setp(engine_ax.get_xticklabels(), visible=False) # x labels only on bottom

        # ---- Throttle, with pedal switch on a second y axis ----
        throttle_ax = plt.subplot(313, sharex=speed_ax)
        throttle_color = "tab:purple"
        throttle_ax.plot(seconds, self.sync_df["throttle"],
                         color=throttle_color)
        throttle_ax.set_ylim([-25, 100]) # Shift throttle trace up
        throttle_ax.set_yticks([0, 20, 40, 60, 80, 100])

        throttle_ax.set_xlabel("Time (s)")
        throttle_ax.set_ylabel("Throttle (deg)", color=throttle_color)
        throttle_ax.tick_params(axis="y", labelcolor=throttle_color)

        # https://matplotlib.org/gallery/api/two_scales.html
        pedal_ax = throttle_ax.twinx()
        pedal_color = "tab:red"
        pedal_ax.plot(seconds, self.sync_df["pedal_sw"], color=pedal_color)
        pedal_ax.set_ylim([-.25, 8]) # scale down pedal switch
        pedal_ax.set_yticks([0, 1])
        pedal_ax.set_ylabel("Pedal Switch", color=pedal_color)
        pedal_ax.tick_params(axis="y", labelcolor=pedal_color)

        self.export_plot("downhill")
        plt.clf()

    def get_run_type(self):
        """Return the string identifying this run type ("DownhillRun")."""
        run_type = "DownhillRun"
        return run_type


class Output(object):
    """Collects terminal output in a buffer so it can be dumped to a log.

    Attributes:
        verbose: when falsy, messages flagged verbose_only are logged but
            not shown on screen.
        warn_prompt: when truthy, warn() waits for the user to press Enter.
        log_string: everything passed to print()/warn() so far, one entry
            per line.
    """

    def __init__(self, verbose, warn_p):
        self.verbose = verbose
        self.warn_prompt = warn_p
        self.log_string = ""

    def print(self, string, verbose_only=False):
        """Wrapper for standard print function that duplicates output to
        run-specific buffer.

        Like the built-in print, any object is accepted; it is converted
        with str() before being logged and displayed. Messages flagged
        verbose_only are always logged but only displayed in verbose mode.
        """
        text = str(string)
        # Add everything to log even if not output to screen.
        self.add_to_log(text)
        if self.verbose or not verbose_only:
            print(text)

    def add_to_log(self, string):
        """Append string (converted with str()) and a newline to the log."""
        self.log_string += str(string) + "\n"

    def warn(self, warn_string):
        """Log and display a warning, then pause or print a blank line.

        If warn_prompt is set the user must press Enter to continue;
        otherwise a blank line is printed (and logged) after the warning.
        """
        # Add to log and display in terminal.
        self.print("\nWarning: " + str(warn_string))
        if self.warn_prompt:
            input("Press Enter to continue.")
        else:
            self.print("") # blank line

    def get_log_dump(self):
        """Return the accumulated log text."""
        return self.log_string


def main_prog():
    """Entry point: parse command-line options, build the run group, then
    optionally plot and finally export the runs.

    Raises FilenameError if the --log-dir value is not an existing directory.
    """
    global LOG_DIR

    # Command-line options, registered below in the order listed here.
    # Anything passed on the command line after "python run.py" is
    # interpreted against this table.
    # https://docs.python.org/3/howto/argparse.html
    # https://www.programcreek.com/python/example/748/argparse.ArgumentParser
    option_specs = [
        (("-a", "--auto"), {
            "help": "Automatically process all data in raw_data folders.",
            "action": "store_true",
        }),
        (("-o", "--over"), {
            "help": "Overwrite existing data in sync_data folder without "
                    "prompting.",
            "action": "store_true",
        }),
        (("-p", "--plot"), {
            "help": "Plot data before and after processing.",
            "action": "store_true",
        }),
        (("-v", "--verbose"), {
            "help": "Include additional output for diagnosis.",
            "action": "store_true",
        }),
        (("-d", "--desc"), {
            "help": "Specify a description string to append to output file "
                    "names - data and plot files (if -p also used)",
            "type": str,
            "default": "",
        }),
        (("-l", "--log-dir"), {
            "help": "Specify a directory where log file containing that "
                    "run's output and error trace should be saved when error "
                    "encountered.",
            "type": str,
            "default": LOG_DIR,
        }),
        # store_false: args.ignore_warn is True unless -i is given.
        (("-i", "--ignore-warn"), {
            "help": "Do not prompt user to acknowledge warnings.",
            "action": "store_false",
        }),
        (("-s", "--start"), {
            "help": "Specify run number to start with when processing all "
                    "runs (with -a option).",
            "type": str,
            "default": False,
        }),
    ]

    parser = argparse.ArgumentParser(
        description="Program to preprocess EX1 CVT data for easier analysis")
    for flags, settings in option_specs:
        parser.add_argument(*flags, **settings)
    args = parser.parse_args()

    # Reject an unusable log directory before doing any work.
    if not os.path.isdir(args.log_dir):
        raise FilenameError("Bad log-dir argument. Must be valid path. Aborting.")
    LOG_DIR = args.log_dir  # update global variable

    run_group = RunGroup(args.auto, args.start, args.verbose, args.ignore_warn)

    if args.plot:
        if PLOT_LIB_PRESENT:
            # Create folder for output plots if it doesn't exist already.
            if not os.path.exists(PLOT_DIR):
                os.mkdir(PLOT_DIR)
            run_group.plot_runs(args.over, args.desc)
        else:
            print("\nFailed to import matplotlib. Cannot plot data.")

    # Create folder for output data if it doesn't exist already.
    if not os.path.exists(SYNC_DIR):
        os.mkdir(SYNC_DIR)

    run_group.export_runs(args.over, args.desc)


# Run main_prog() only when this file is executed directly as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main_prog()