Breakthrough-Energy · BainanXia · Mar 5, 2021 · Mar 2, 2021 · Mar 2, 2021 · Mar 4, 2021
diff --git a/postreise/plot/demo/pie_generation_vs_capacity.ipynb b/postreise/plot/demo/pie_generation_vs_capacity.ipynb
diff --git a/postreise/plot/plot_pie_generation_vs_capacity.py b/postreise/plot/plot_pie_generation_vs_capacity.py
@@ -0,0 +1,248 @@
+import matplotlib.pyplot as plt
+import numpy as np
+import pandas as pd
+from powersimdata.input.grid import Grid
+from powersimdata.network.usa_tamu.constants.plants import type2color, type2label
+from powersimdata.network.usa_tamu.usa_tamu_model import area_to_loadzone
+from powersimdata.scenario.scenario import Scenario
+
+from postreise.analyze.generation.capacity_value import sum_capacity_by_type_zone
+from postreise.analyze.generation.summarize import sum_generation_by_type_zone
+
+
+def plot_pie_generation_vs_capacity(
+    areas,
+    area_types=None,
+    scenario_ids=None,
+    scenario_names=None,
+    time_range=None,
+    time_zone=None,
+    custom_data=None,
+    resource_labels=None,
+    resource_colors=None,
+    min_percentage=0,
+):
+    """Plot any number of scenarios as pie charts with two columns per scenario -
+    generation and capacity.
+
+    :param list/str areas: list of area(s), each area is one of *loadzone*, *state*,
+        *state abbreviation*, *interconnect*, *'all'*
+    :param list/str area_types: list of area_type(s), each area_type is one of
+        *'loadzone'*, *'state'*, *'state_abbr'*, *'interconnect'*, defaults to None.
+    :param int/list/str scenario_ids: list of scenario id(s), defaults to None.
+    :param list/str scenario_names: list of scenario name(s) of same len as scenario
+        ids, defaults to None
+    :param tuple time_range: [start_timestamp, end_timestamp] where each time stamp
+        is pandas.Timestamp/numpy.datetime64/datetime.datetime. If None, the entire
+        time range is used for the given scenario.
+    :param str time_zone: new time zone, defaults to None, which uses UTC.
+    :param list custom_data: list of dictionaries with each element being
+        hand-generated data as returned by
+        :func:`postreise.plot_bar_generation_vs_capacity.make_gen_cap_custom_data`,
+        defaults to None.
+    :param dict resource_labels: a dictionary with keys being resource types and values
+        being labels, which is used to customize resource labels for selected resource
+        types to show in the plots. Defaults to None, in which case a default set of
+        labels is used.
+    :param dict resource_colors: a dictionary with keys being resource types and values
+        being colors, which is used to customize resource colors for selected resource
+        types to show in the plots. Defaults to None, in which case a default set of
+        colors is used.
+    :param float min_percentage: roll up small pie pieces into a single category,
+        resources with percentage less than the set value will be pooled together,
+        defaults to 0.
+    :raises ValueError:
+        if length of area_types and areas is different and/or
+        if length of scenario_names and scenario_ids is different and/or
+        if less than two scenario_ids and/or custom_data in total is provided.
+    :raises TypeError:
+        if resource_labels are provided but not in a dictionary format and/or
+        if resource_colors are provided but not in a dictionary format.
+
+    .. note::
+        if one wants to plot scenario data and custom data together, custom data MUST be
+        in TWh for generation and GW for capacity in order to conduct appropriate
+        comparison.
+    """
+    if isinstance(areas, str):
+        areas = [areas]
+    if isinstance(area_types, str):
+        area_types = [area_types]
+    if not area_types:
+        area_types = [None] * len(areas)
+    if len(areas) != len(area_types):
+        raise ValueError(
+            "ERROR: if area_types are provided, number of area_types must match number of areas"
+        )
+
+    if not scenario_ids:
+        scenario_ids = []
+    if isinstance(scenario_ids, (int, str)):
+        scenario_ids = [scenario_ids]
+    if isinstance(scenario_names, str):
+        scenario_names = [scenario_names]
+    if scenario_names and len(scenario_names) != len(scenario_ids):
+        raise ValueError(
+            "ERROR: if scenario names are provided, number of scenario names must match number of scenario ids"
+        )
+    if not custom_data:
+        custom_data = {}
+    if len(scenario_ids) + len(custom_data) <= 1:
+        raise ValueError(
+            "ERROR: must include at least two scenario ids and/or custom data"
+        )
+    if not resource_labels:
+        resource_labels = dict()
+    if not isinstance(resource_labels, dict):
+        raise TypeError("ERROR: resource_labels should be a dictionary")
+    if not resource_colors:
+        resource_colors = dict()
+    if not isinstance(resource_colors, dict):
+        raise TypeError("ERROR: resource_colors should be a dictionary")
+
+    type2label.update(resource_labels)
+    type2color.update(resource_colors)
+
+    grid = Grid(["USA"])
+    id2loadzone = grid.id2zone
+    all_loadzone_data = {}
+    scenario_data = {}
+    for i, sid in enumerate(scenario_ids):
+        scenario = Scenario(sid)
+        all_loadzone_data[sid] = {
+            "gen": sum_generation_by_type_zone(scenario, time_range, time_zone).rename(
+                columns=id2loadzone
+            ),
+            "cap": sum_capacity_by_type_zone(scenario).rename(columns=id2loadzone),
+        }
+        scenario_data[sid] = {
+            "name": scenario_names[i] if scenario_names else scenario.info["name"],
+            "gen": {"label": "Generation", "unit": "TWh", "data": {}},
+            "cap": {"label": "Capacity", "unit": "GW", "data": {}},
+        }
+    for area, area_type in zip(areas, area_types):
+        loadzone_set = area_to_loadzone(grid, area, area_type)
+        for sid in scenario_ids:
+            scenario_data[sid]["gen"]["data"][area] = (
+                all_loadzone_data[sid]["gen"][loadzone_set]
+                .sum(axis=1)
+                .divide(1e6)
+                .astype("float")
+                .round(2)
+                .to_dict()
+            )
+            scenario_data[sid]["cap"]["data"][area] = (
+                all_loadzone_data[sid]["cap"][loadzone_set]
+                .sum(axis=1)
+                .divide(1e3)
+                .astype("float")
+                .round(2)
+                .to_dict()
+            )
+    for c_data in custom_data:
+        scenario_data[c_data["name"]] = c_data
+
+    for area in areas:
+        ax_data_list = []
+        for sd in scenario_data.values():
+            for side in ["gen", "cap"]:
+                ax_data, labels = _roll_up_small_pie_wedges(
+                    sd[side]["data"][area], min_percentage
+                )
+
+                ax_data_list.append(
+                    {
+                        "title": "{0}\n{1}".format(sd["name"], sd[side]["label"]),
+                        "labels": labels,
+                        "values": list(ax_data.values()),
+                        "colors": [type2color[r] for r in ax_data.keys()],
+                        "unit": sd[side]["unit"],
+                    }
+                )
+
+        _construct_pie_visuals(area, ax_data_list)
+
+
+def _roll_up_small_pie_wedges(resource_data, min_percentage):
+    """Combine small wedges into a single category. Removes wedges with value 0.
+
+    :param dict resource_data: values for each resource type.
+    :param float min_percentage: roll up small pie pieces into a single category,
+        resources with percentage less than the set value will be pooled together,
+        defaults to 0.
+    :return: (*dict*) -- returns updated axis data and a list of labels that includes
+        the small category label if it exists
+    """
+    resource_list = list(resource_data.keys())
+    total_resources = sum(resource_data.values())
+
+    small_categories = []
+    small_category_value = 0
+    small_category_label = ""
+    for resource in resource_list:
+        percentage = round(resource_data[resource] / total_resources * 100, 1)
+        if percentage == 0.0:
+            resource_data.pop(resource)
+        elif percentage <= min_percentage:
+            small_categories.append(resource)
+            small_category_label += "{0} {1}%\n".format(
+                type2label[resource], percentage
+            )
+            small_category_value += resource_data[resource]
+
+    if len(small_categories) > 1:
+        for resource in small_categories:
+            resource_data.pop(resource)
+
+    labels = [type2label[resource] for resource in resource_data.keys()]
+
+    if len(small_categories) > 1:
+        resource_data["other"] = small_category_value
+        labels.append(small_category_label)
+
+    return resource_data, labels
+
+
+def _construct_pie_visuals(zone, ax_data_list):
+    """Plot formatted data.
+
+    :param str zone: the zone name
+    :param list ax_data_list: a list of dictionaries with keys being labels,
+        values and colors.
+    """
+    rows = int(len(ax_data_list) / 2)
+    fig, axes = plt.subplots(rows, 2, figsize=(20, 12 * rows))
+    if rows > 1:
+        axes = np.concatenate(axes)
+    plt.suptitle(zone, fontsize=36, verticalalignment="bottom")
+
+    for ax_data, ax in zip(ax_data_list, axes):
+        df = pd.DataFrame({"": ax_data["values"]}, index=ax_data["labels"])
+        df.plot(
+            kind="pie",
+            ax=ax,
+            subplots=True,
+            fontsize=18,
+            autopct="%1.1f%%",
+            startangle=180,
+            pctdistance=0.55,
+            colors=ax_data["colors"],
+            wedgeprops={"edgecolor": "white", "linewidth": 6},
+        )
+        ax.set_title(ax_data["title"], fontsize=30)
+        ax.get_legend().remove()
+        ax.tick_params(axis="y", which="both", left=False)
+        ax.add_artist(plt.Circle((0, 0), 0.70, fc="white"))
+        ax.text(
+            0,
+            0,
+            "{0}\n{1}".format(round(sum(ax_data["values"]), 1), ax_data["unit"]),
+            fontsize=22,
+            verticalalignment="center",
+            horizontalalignment="center",
+            weight="bold",
+            color="lightgray",
+        )
+
+    plt.tight_layout()
+    fig.subplots_adjust(hspace=-0.2)
diff --git a/postreise/plot/tests/test_plot_pie_generation_vs_capacity.py b/postreise/plot/tests/test_plot_pie_generation_vs_capacity.py
@@ -0,0 +1,63 @@
+import pytest
+
+from postreise.plot.plot_pie_generation_vs_capacity import (
+    plot_pie_generation_vs_capacity,
+)
+
+
+def test_handle_plot_inputs_throws_valueError_for_different_length_of_areas_and_area_types():
+    with pytest.raises(ValueError):
+        plot_pie_generation_vs_capacity(
+            areas=["all", "Western", "Texas", "Eastern"],
+            area_types=["interconnect"],
+            scenario_ids=[823, 824],
+            scenario_names=["USA 2016", "USA 2020"],
+            min_percentage=2.5,
+        )
+
+
+def test_handle_plot_inputs_throws_valueError_for_different_length_of_scenario_ids_and_scenario_names():
+    with pytest.raises(ValueError):
+        plot_pie_generation_vs_capacity(
+            areas=["all", "Western", "Texas", "Eastern"],
+            area_types=[None, "interconnect", None, None],
+            scenario_ids=[823, 824],
+            scenario_names=["USA 2016"],
+            min_percentage=2.5,
+        )
+
+
+def test_handle_plot_inputs_throws_valueError_for_less_than_two_scenario_ids_and_custom_data_is_provided():
+    with pytest.raises(ValueError):
+        plot_pie_generation_vs_capacity(
+            areas=["all", "Western", "Texas", "Eastern"],
+            area_types=[None, "interconnect", None, None],
+            scenario_ids=[823],
+            scenario_names=["USA 2016"],
+            min_percentage=2.5,
+        )
+
+
+def test_handle_plot_inputs_throws_typeError_for_resource_labels_not_in_a_dictionary_format():
+    with pytest.raises(TypeError):
+        plot_pie_generation_vs_capacity(
+            areas=["all", "Western", "Texas", "Eastern"],
+            area_types=[None, "interconnect", None, None],
+            scenario_ids=[823, 824],
+            scenario_names=["USA 2016", "USA 2020"],
+            resource_labels=["My Natural Gas", "My Coal"],
+            min_percentage=2.5,
+        )
+
+
+def test_handle_plot_inputs_throws_typeError_for_resource_colors_not_in_a_dictionary_format():
+    with pytest.raises(TypeError):
+        plot_pie_generation_vs_capacity(
+            areas=["all", "Western", "Texas", "Eastern"],
+            area_types=[None, "interconnect", None, None],
+            scenario_ids=[823, 824],
+            scenario_names=["USA 2016", "USA 2020"],
+            resource_labels={"ng": "My Natural Gas", "coal": "My Coal"},
+            resource_colors=["red", "blue", "yellow"],
+            min_percentage=2.5,
+        )