Source code for marmot.plottingmodules.ramping

# -*- coding: utf-8 -*-
"""Generator start and ramping plots.

This module creates bar plot of the total volume of generator starts in MW,GW,etc.

@author: Marty Schwarz
"""

import logging
from pathlib import Path
from typing import List

import pandas as pd

import marmot.utils.mconfig as mconfig
from marmot.plottingmodules.plotutils.plot_data_helper import (
    GenCategories,
    PlotDataStoreAndProcessor,
)
from marmot.plottingmodules.plotutils.plot_exceptions import (
    MissingInputData,
    MissingZoneData,
    UnderDevelopment,
)
from marmot.plottingmodules.plotutils.plot_library import PlotLibrary
from marmot.plottingmodules.plotutils.styles import ColorList
from marmot.plottingmodules.plotutils.timeseries_modifiers import (
    set_timestamp_date_range,
)

logger = logging.getLogger("plotter." + __name__)
plot_data_settings: dict = mconfig.parser("plot_data")


[docs]class Ramping(PlotDataStoreAndProcessor):
    """Generator start and ramping plots.

    The ramping.py module contains methods that are
    related to the ramp periods of generators.

    Ramping inherits from the PlotDataStoreAndProcessor class to assist
    in creating figures.
    """

    def __init__(
        self,
        Zones: List[str],
        Scenarios: List[str],
        AGG_BY: str,
        ordered_gen: List[str],
        marmot_solutions_folder: Path,
        gen_categories: GenCategories = GenCategories(),
        color_list: list = ColorList().colors,
        **kwargs,
    ):
        """
        Args:
            Zones (List[str]): List of regions/zones to plot.
            Scenarios (List[str]): List of scenarios to plot.
            AGG_BY (str): Informs region type to aggregate by when creating plots.
            ordered_gen (List[str]): Ordered list of generator technologies to plot,
                order defines the generator technology position in stacked bar and area plots.
            marmot_solutions_folder (Path): Directory containing Marmot solution outputs.
            gen_categories (GenCategories): Instance of GenCategories class, groups generator technologies
                into defined categories.
                Deafults to GenCategories.
            color_list (list, optional): List of colors to apply to non-gen plots.
                Defaults to ColorList().colors.
        """
        # Instantiation of PlotDataStoreAndProcessor
        super().__init__(AGG_BY, ordered_gen, marmot_solutions_folder, **kwargs)

        self.Zones = Zones
        self.Scenarios = Scenarios
        self.gen_categories = gen_categories
        self.color_list = color_list

[docs]    def capacity_started(
        self,
        start_date_range: str = None,
        end_date_range: str = None,
        scenario_groupby: str = "Scenario",
        **_,
    ):
        """Creates bar plots of total thermal capacity started by technology type.

        Each sceanrio is plotted as a separate color grouped bar.

        Args:
            start_date_range (str, optional): Defines a start date at which to
                represent data from.
                Defaults to None.
            end_date_range (str, optional): Defines a end date at which to
                represent data to.
                Defaults to None.
            scenario_groupby (str, optional): Specifies whether to group data by Scenario
                or Year-Sceanrio. If grouping by Year-Sceanrio the year will be identified
                from the timestamp and appeneded to the sceanrio name. This is useful when
                plotting data which covers multiple years such as ReEDS.
                Defaults to Scenario.

                .. versionadded:: 0.10.0

        Returns:
            dict: Dictionary containing the created plot and its data table.
        """
        outputs: dict = {}

        # List of properties needed by the plot, properties are a set of
        # tuples and contain 3 parts:
        # required True/False, property name and scenarios required,
        # scenarios must be a list.
        properties = [
            (True, "generator_Generation", self.Scenarios),
            (True, "generator_Installed_Capacity", self.Scenarios),
        ]

        # Runs get_formatted_data within PlotDataStoreAndProcessor to populate
        # PlotDataStoreAndProcessor dictionary with all required properties,
        # returns a 1 if required data is missing
        check_input_data = self.get_formatted_data(properties)

        if 1 in check_input_data:
            return MissingInputData()

        for zone_input in self.Zones:
            logger.info(f"{self.AGG_BY} = {zone_input}")
            cap_stated_chunks = []

            for scenario in self.Scenarios:
                logger.info(f"Scenario = {str(scenario)}")

                Gen: pd.DataFrame = self["generator_Generation"].get(scenario)
                try:
                    Gen = Gen.xs(zone_input, level=self.AGG_BY)
                except KeyError:
                    logger.warning(f"No installed capacity in : {zone_input}")
                    break

                Cap: pd.DataFrame = self["generator_Installed_Capacity"].get(scenario)
                Cap = Cap.xs(zone_input, level=self.AGG_BY)

                if pd.notna(start_date_range):
                    Gen = set_timestamp_date_range(
                        Gen, start_date_range, end_date_range
                    )
                    if Gen.empty is True:
                        logger.warning("No Generation in selected Date Range")
                        continue

                Gen = Gen.reset_index()
                Gen["year"] = Gen.timestamp.dt.year
                Gen = self.rename_gen_techs(Gen)
                Gen.tech = Gen.tech.astype("category")
                Gen.tech = Gen.tech.cat.set_categories(self.ordered_gen)
                Gen = Gen.rename(columns={"values": "Output (MWh)"})
                # We are only interested in thermal starts/stops.
                Gen = Gen[Gen["tech"].isin(self.gen_categories.thermal)]

                Cap = Cap.reset_index()
                Cap["year"] = Cap.timestamp.dt.year
                Cap = self.rename_gen_techs(Cap)
                Cap = Cap.drop(columns=["timestamp", "units"])
                Cap = Cap.rename(columns={"values": "Installed Capacity (MW)"})
                gen_cap = Gen.merge(Cap, on=["year", "tech", "gen_name"])
                gen_cap = gen_cap.set_index("timestamp")

                gen_cap = self.year_scenario_grouper(
                    gen_cap,
                    scenario,
                    groupby=scenario_groupby,
                    additional_groups=["timestamp", "tech", "gen_name"],
                ).sum()
                unique_idx = list(gen_cap.index.get_level_values("Scenario").unique())
                cap_started_df = pd.DataFrame(
                    columns=gen_cap.index.get_level_values("tech").unique(),
                    index=unique_idx,
                )

                # If split on Year-Scenario we want to loop over individual years
                for scen in cap_started_df.index:
                    df = gen_cap.xs(scen, level="Scenario")
                    # Get list of unique techs by Scenario-year
                    tech_names = df.index.get_level_values("tech").unique()
                    for tech_name in tech_names:
                        stt = df.xs(tech_name, level="tech", drop_level=False)
                        gen_names = stt.index.get_level_values("gen_name").unique()
                        cap_started = 0
                        for gen in gen_names:
                            sgt = stt.xs(gen, level="gen_name").fillna(0)
                            # Check that this generator has some, but not all,
                            # uncommitted hours.
                            if any(sgt["Output (MWh)"] == 0) and not all(
                                sgt["Output (MWh)"] == 0
                            ):
                                for idx in range(len(sgt["Output (MWh)"]) - 1):
                                    if (
                                        sgt["Output (MWh)"].iloc[idx] == 0
                                        and not sgt["Output (MWh)"].iloc[idx + 1] == 0
                                    ):
                                        cap_started = (
                                            cap_started
                                            + sgt["Installed Capacity (MW)"].iloc[idx]
                                        )

                        cap_started_df.loc[scen, tech_name] = cap_started

                cap_stated_chunks.append(cap_started_df)

            cap_started_all_scenarios = pd.concat(cap_stated_chunks).dropna(axis=1)

            if cap_started_all_scenarios.empty == True:
                out = MissingZoneData()
                outputs[zone_input] = out
                continue

            cap_started_all_scenarios = cap_started_all_scenarios.fillna(0)
            unitconversion = self.capacity_energy_unitconversion(
                cap_started_all_scenarios, self.Scenarios
            )

            cap_started_all_scenarios = (
                cap_started_all_scenarios / unitconversion["divisor"]
            )
            Data_Table_Out = cap_started_all_scenarios.T.add_suffix(
                f" ({unitconversion['units']}-starts)"
            )

            # transpose, sets scenarios as columns
            cap_started_all_scenarios = cap_started_all_scenarios.T

            mplt = PlotLibrary()
            fig, ax = mplt.get_figure()
            mplt.barplot(cap_started_all_scenarios, color=self.color_list)

            ax.set_ylabel(
                f"Capacity Started ({unitconversion['units']}-starts)",
                color="black",
                rotation="vertical",
            )

            mplt.add_legend()
            if plot_data_settings["plot_title_as_region"]:
                mplt.add_main_title(zone_input)

            outputs[zone_input] = {"fig": fig, "data_table": Data_Table_Out}
        return outputs

[docs]    def count_ramps(self, **_):
        """Plot under development

        Returns:
            UnderDevelopment(): Exception class, plot is not functional.
        """

        # Plot currently displays the same as capacity_started, this plot needs looking at

        outputs = UnderDevelopment()
        logger.warning("count_ramps is under development")
        return outputs

        outputs: dict = {}

        # List of properties needed by the plot, properties are a set of tuples and
        # contain 3 parts: required True/False, property name and scenarios required,
        # scenarios must be a list.
        properties = [
            (True, "generator_Generation", self.Scenarios),
            (True, "generator_Installed_Capacity", self.Scenarios),
        ]

        # Runs get_formatted_data within PlotDataStoreAndProcessor to populate PlotDataStoreAndProcessor dictionary
        # with all required properties, returns a 1 if required data is missing
        check_input_data = self.get_formatted_data(properties)

        if 1 in check_input_data:
            return MissingInputData()

        for zone_input in self.Zones:
            logger.info(f"Zone =  {zone_input}")
            cap_started_chunk = []

            for scenario in self.Scenarios:

                logger.info(f"Scenario = {str(scenario)}")
                Gen = self["generator_Generation"].get(scenario)
                Gen = Gen.xs(zone_input, level=self.AGG_BY)

                Gen = Gen.reset_index()
                Gen.tech = Gen.tech.astype("category")
                Gen.tech = Gen.tech.cat.set_categories(self.ordered_gen)
                Gen = Gen.rename(columns={"values": "Output (MWh)"})
                Gen = Gen[["timestamp", "gen_name", "tech", "Output (MWh)"]]
                Gen = Gen[
                    Gen["tech"].isin(self.gen_categories.thermal)
                ]  # We are only interested in thermal starts/stops.tops.

                Cap = self["generator_Installed_Capacity"].get(scenario)
                Cap = Cap.xs(zone_input, level=self.AGG_BY)
                Cap = Cap.reset_index()
                Cap = Cap.rename(columns={"values": "Installed Capacity (MW)"})
                Cap = Cap[["gen_name", "Installed Capacity (MW)"]]
                Gen = pd.merge(Gen, Cap, on=["gen_name"])
                Gen.index = Gen.timestamp
                Gen = Gen.drop(columns=["timestamp"])

                # Min = pd.read_hdf(os.path.join(Marmot_Solutions_folder, scenario,"Processed_HDF5_folder", scenario + "_formatted.h5"),"generator_Hours_at_Minimum")
                # Min = Min.xs(zone_input, level = AGG_BY)

                if pd.notna(start_date_range):
                    logger.info(
                        f"Plotting specific date range: \
                    {str(start_date_range)} to {str(end_date_range)}"
                    )
                    Gen = Gen[start_date_range:end_date_range]

                tech_names = Gen["tech"].unique()
                ramp_counts = pd.DataFrame(columns=tech_names, index=[scenario])

                for tech_name in tech_names:
                    stt = Gen.loc[Gen["tech"] == tech_name]

                    gen_names = stt["gen_name"].unique()

                    up_ramps = 0

                    for gen in gen_names:
                        sgt = stt.loc[stt["gen_name"] == gen]
                        if any(sgt["Output (MWh)"] == 0) and not all(
                            sgt["Output (MWh)"] == 0
                        ):  # Check that this generator has some, but not all, uncommitted hours.
                            # print('Counting starts for: ' + gen)
                            for idx in range(len(sgt["Output (MWh)"]) - 1):
                                if (
                                    sgt["Output (MWh)"].iloc[idx] == 0
                                    and not sgt["Output (MWh)"].iloc[idx + 1] == 0
                                ):
                                    up_ramps = (
                                        up_ramps
                                        + sgt["Installed Capacity (MW)"].iloc[idx]
                                    )
                                # print('started on '+ timestamp)
                                # if sgt[0].iloc[idx] == 0 and not idx == 0 and not sgt[0].iloc[idx - 1] == 0:
                                #     stops = stops + 1

                    ramp_counts[tech_name] = up_ramps

                cap_started_chunk.append(ramp_counts)

            cap_started_all_scenarios = pd.concat(cap_started_chunk)

            if cap_started_all_scenarios.empty == True:
                out = MissingZoneData()
                outputs[zone_input] = out
                continue

            cap_started_all_scenarios.index = (
                cap_started_all_scenarios.index.str.replace("_", " ")
            )

            unitconversion = self.capacity_energy_unitconversion(
                cap_started_all_scenarios, self.Scenarios
            )

            cap_started_all_scenarios = (
                cap_started_all_scenarios / unitconversion["divisor"]
            )
            Data_Table_Out = cap_started_all_scenarios.T.add_suffix(
                f" ({unitconversion['units']}-starts)"
            )

            mplt = PlotLibrary()
            fig2, ax = mplt.get_figure()
            cap_started_all_scenarios.T.plot.bar(
                stacked=False,
                color=self.color_list,
                edgecolor="black",
                linewidth="0.1",
                ax=ax,
            )

            ax.set_ylabel(
                f"Capacity Started ({unitconversion['units']}-starts)",
                color="black",
                rotation="vertical",
            )

            # Set x-tick labels
            tick_labels = cap_started_all_scenarios.columns
            mplt.set_barplot_xticklabels(tick_labels)

            ax.legend(
                loc="lower left",
                bbox_to_anchor=(1, 0),
                facecolor="inherit",
                frameon=True,
            )
            if plot_data_settings["plot_title_as_region"]:
                mplt.add_main_title(zone_input)

            outputs[zone_input] = {"fig": fig2, "data_table": Data_Table_Out}
        return outputs

[docs]    def count_starts_single_gen(
        self,
        prop: str = None,
        start_date_range: str = None,
        end_date_range: str = None,
        **_,
    ):
        """Counts the number of times a specified generator turns on during the simulation.

        Args:

            prop (str, optional): Name of the PLEXOS generator.
                Defaults to None.
        Returns:
            dict: Dictionary containing the created plot and its data table.
        """

        outputs: dict = {}

        # List of properties needed by the plot, properties are a set of
        # tuples and contain 3 parts:
        # required True/False, property name and scenarios required,
        # scenarios must be a list.
        properties = [
            (True, "generator_Generation", self.Scenarios),
        ]

        # Runs get_formatted_data within PlotDataStoreAndProcessor to populate
        # PlotDataStoreAndProcessor dictionary with all required properties,
        # returns a 1 if required data is missing
        check_input_data = self.get_formatted_data(properties)

        if 1 in check_input_data:
            return MissingInputData()

        for zone_input in self.Zones:
            logger.info(f"{self.AGG_BY} = {zone_input}")
            cycles_df = pd.DataFrame(
                columns=[prop],
                index=self.Scenarios,
            )

            for scenario in self.Scenarios:
                logger.info(f"Scenario = {str(scenario)}")

                Gen: pd.DataFrame = self["generator_Generation"].get(scenario)
                try:
                    Gen = Gen.xs(prop, level="gen_name")
                except KeyError:
                    logger.warning(f"{prop} has no generation in {zone_input}")
                    break

                if pd.notna(start_date_range):
                    Gen = set_timestamp_date_range(
                        Gen, start_date_range, end_date_range
                    )
                    if Gen.empty is True:
                        logger.warning("No Generation in selected Date Range")
                        continue

                starts = 0
                for idx in range(len(Gen["values"]) - 1):
                    if (
                        Gen["values"].iloc[idx] == 0
                        and not Gen["values"].iloc[idx + 1] == 0
                    ):
                        starts += 1

                cycles_df.loc[scenario, prop] = starts

            if cycles_df.empty == True:
                outputs[zone_input] = MissingZoneData()
                continue

            cycles_df = cycles_df.fillna(0)
            unitconversion = self.capacity_energy_unitconversion(
                cycles_df, self.Scenarios
            )

            cycles_df = cycles_df / unitconversion["divisor"]
            Data_Table_Out = cycles_df.add_suffix("starts")

            mplt = PlotLibrary()
            fig, ax = mplt.get_figure()
            mplt.barplot(cycles_df, color=self.color_list)

            ax.set_ylabel(
                "Number of starts",
                color="black",
                rotation="vertical",
            )

            # mplt.add_legend()
            mplt.add_main_title(prop)

            outputs[zone_input] = {"fig": fig, "data_table": Data_Table_Out}
        return outputs