# Source code for combinator_functions

import pandas as pd
from itertools import product


def check_scenario_name(df, scen_name):
    """
    Note:
        This function checks that the first record of the passed DataFrame carries the expected scenario 0 name
        and prints an error message if it does not.

    Parameters:
        df: A DataFrame which must have a column named 'Scenario Name'.\n
        scen_name: The scenario name expected in the first record (scenario 0) of the passed DataFrame.

    Return:
        None. An error message is printed when the first record's 'Scenario Name' is not scen_name or when
        the passed DataFrame has no records.

    """
    scenario_names = df['Scenario Name']
    # Read the first record by position: a label lookup of 0 raises KeyError whenever the index does not
    # contain the label 0 (e.g., a filtered or an empty DataFrame).
    if len(scenario_names) > 0 and scenario_names.iloc[0] == scen_name:
        return
    print(f'Error:  Scenario 0 Scenario Name should be "{scen_name}"')


def scrub_data(settings, df):
    """
    Note:
        This function scrubs some records from the passed DataFrame. The passed DataFrame itself is not modified.

    Parameters:
        settings: The SetInputs class; only its base_scenario_name attribute is read here.\n
        df: The passed DataFrame, which must have 'Scenario Name' and 'Scenario' columns.

    Return:
        A new DataFrame without the base_scenario_name records and without the 'Scenario' column. If a
        'Model Year' column is present, its "TOTAL" records are also removed and the column is converted to int.

    """
    not_base_scenario = df['Scenario Name'] != settings.base_scenario_name
    scrubbed = df.loc[not_base_scenario].drop(columns=['Scenario'])
    if 'Model Year' in scrubbed.columns:
        # The "TOTAL" records have to be removed before the cast since they cannot be converted to int.
        scrubbed = scrubbed.loc[scrubbed['Model Year'] != 'TOTAL'].copy()
        scrubbed['Model Year'] = scrubbed['Model Year'].astype(int)
    return scrubbed


def read_and_combine_files(settings, report_name):
    """
    Note:
        For every entry of settings.model_runs_to_combine_path_dict, this function reads '<report_name>.csv' from
        the Framework OEM run folder (first item) and the NonFramework OEM run folder (second item), checks
        scenario 0 of each report via check_scenario_name, scrubs each report via scrub_data, and stacks the
        results.

    Parameters:
        settings: The SetInputs class; its base_scenario_name and model_runs_to_combine_path_dict attributes
        are read here.\n
        report_name: The name of the report(s) to read (without the '.csv' extension).

    Return:
        A DataFrame that combines the Framework and NonFramework OEM run results for all runs in the
        model_runs_to_combine_path_dict; an empty DataFrame if that dictionary is empty.

    Raises:
        SystemExit: If the scrubbed Framework and NonFramework reports of a run do not list the same
        scenario names in the same order.

    """
    reports_to_combine = []
    for files_to_combine in settings.model_runs_to_combine_path_dict.values():
        framework_oem_run = files_to_combine[0]
        nonframework_oem_run = files_to_combine[1]

        # Read, check and scrub the Framework report first and the NonFramework report second.
        run_reports = []
        for run_path in (framework_oem_run, nonframework_oem_run):
            report = pd.read_csv(run_path / f'{report_name}.csv')
            check_scenario_name(report, settings.base_scenario_name)
            run_reports.append(scrub_data(settings, report))
        framework_oem_report, nonframework_oem_report = run_reports

        framework_oem_scenario_names = list(framework_oem_report['Scenario Name'].unique())
        nonframework_oem_scenario_names = list(nonframework_oem_report['Scenario Name'].unique())

        if framework_oem_scenario_names != nonframework_oem_scenario_names:
            print('Error: Scenario Names do not match making combination questionable.')
            # The site-provided exit() helper is meant for interactive sessions and ends the process with a
            # success status; raise SystemExit directly with a non-zero status so the failure is visible.
            raise SystemExit(1)

        reports_to_combine.extend(run_reports)

    if not reports_to_combine:
        # pd.concat raises ValueError on an empty list, so return the empty result explicitly.
        return pd.DataFrame()

    # Concatenate once instead of re-copying an ever-growing DataFrame on every pass through the loop.
    return pd.concat(reports_to_combine, axis=0, ignore_index=True)


def read_files_and_combine_scenarios(settings, report_name):
    """
    Note:
        For every entry of settings.model_runs_with_scenarios_to_combine_path_dict, this function reads
        '<report_name>.csv' from the Framework OEM run folder (first item) and the NonFramework OEM run folder
        (second item), checks scenario 0 of each report via check_scenario_name and scrubs each report via
        scrub_data. Every Framework scenario is then paired with every NonFramework scenario; the records of
        each pairing are stacked and given the Scenario Name '<framework name>_<nonframework name>'.

    Parameters:
        settings: The SetInputs class; its base_scenario_name and model_runs_with_scenarios_to_combine_path_dict
        attributes are read here.\n
        report_name: The name of the report(s) to read (without the '.csv' extension).

    Return:
        A DataFrame that combines the Framework and NonFramework OEM scenario results for all runs in the
        model_runs_with_scenarios_to_combine_path_dict; an empty DataFrame if there is nothing to combine.

    """
    scenarios_to_combine = []
    for files_to_combine in settings.model_runs_with_scenarios_to_combine_path_dict.values():
        framework_oem_run = files_to_combine[0]
        nonframework_oem_run = files_to_combine[1]

        # Read, check and scrub the Framework report first and the NonFramework report second, then split
        # each report once into (scenario name, records) pairs so no report is re-filtered per pairing.
        records_by_scenario = []
        for run_path in (framework_oem_run, nonframework_oem_run):
            report = pd.read_csv(run_path / f'{report_name}.csv')
            check_scenario_name(report, settings.base_scenario_name)
            report = scrub_data(settings, report)
            records_by_scenario.append(
                [(name, report.loc[report['Scenario Name'] == name, :])
                 for name in report['Scenario Name'].unique()]
            )
        framework_scenarios, nonframework_scenarios = records_by_scenario

        for (framework_name, framework), (nonframework_name, nonframework) \
                in product(framework_scenarios, nonframework_scenarios):
            # pd.concat builds a new DataFrame, so renaming the scenario does not touch the source reports.
            scenario_df = pd.concat([framework, nonframework], axis=0, ignore_index=True)
            scenario_df['Scenario Name'] = f'{framework_name}_{nonframework_name}'
            scenarios_to_combine.append(scenario_df)

    if not scenarios_to_combine:
        # pd.concat raises ValueError on an empty list, so return the empty result explicitly.
        return pd.DataFrame()

    # Concatenate once instead of re-copying an ever-growing DataFrame for every scenario pairing.
    return pd.concat(scenarios_to_combine, axis=0, ignore_index=True)


# This file only provides helper functions for import; running it directly just prints a notice.
if __name__ == '__main__':
    notice = 'This module does not run as a script.'
    print(notice)