From d518b29e5ad2442950cf9c3cfa76e08c795ccdd5 Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 13:00:44 -0600
Subject: [PATCH 1/8] Add avoid keyword

---
 buildstock_query/aggregate_query.py     |  2 ++
 buildstock_query/aggregate_query.pyi    |  8 ++++++++
 buildstock_query/main.py                | 10 ++++++----
 buildstock_query/query_core.py          | 18 +++++++++++++++++-
 buildstock_query/schema/query_params.py |  1 +
 buildstock_query/schema/run_params.py   |  2 +-
 buildstock_query/schema/utilities.py    |  4 ++--
 7 files changed, 37 insertions(+), 8 deletions(-)

diff --git a/buildstock_query/aggregate_query.py b/buildstock_query/aggregate_query.py
index 222e1a6..e7f25a1 100644
--- a/buildstock_query/aggregate_query.py
+++ b/buildstock_query/aggregate_query.py
@@ -71,6 +71,7 @@ def aggregate_annual(self, *,
         restrict = [(self._bsq._bs_completed_status_col, [self._bsq.db_schema.completion_values.success])] + restrict
         query = self._bsq._add_join(query, join_list)
         query = self._bsq._add_restrict(query, restrict)
+        query = self._bsq._add_avoid(query, params.avoid)
         query = self._bsq._add_group_by(query, group_by_selection)
         query = self._bsq._add_order_by(query, group_by_selection if params.sort else [])
 
@@ -190,6 +191,7 @@ def aggregate_timeseries(self, params: TSQuery):
             params.restrict = list(params.restrict) + [(self._bsq._ts_upgrade_col, [upgrade_id])]
 
         query = self._bsq._add_restrict(query, params.restrict)
+        query = self._bsq._add_avoid(query, params.avoid)
         query = self._bsq._add_group_by(query, group_by_selection)
         query = self._bsq._add_order_by(query, group_by_selection if params.sort else [])
         query = query.limit(params.limit) if params.limit else query
diff --git a/buildstock_query/aggregate_query.pyi b/buildstock_query/aggregate_query.pyi
index 90eec8e..8fdcf7c 100644
--- a/buildstock_query/aggregate_query.pyi
+++ b/buildstock_query/aggregate_query.pyi
@@ -21,6 +21,7 @@ class BuildStockAggregate:
                          join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                          weights: Sequence[Union[str, tuple]] = [],
                          restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                         avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                          get_quartiles: bool = False,
                          get_nonzero_count: bool = False,
                          ) -> str:
@@ -36,6 +37,7 @@ class BuildStockAggregate:
                          join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                          weights: Sequence[Union[str, tuple]] = [],
                          restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                         avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                          get_quartiles: bool = False,
                          get_nonzero_count: bool = False,
                          ) -> pd.DataFrame:
@@ -51,6 +53,7 @@ class BuildStockAggregate:
                          join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                          weights: Sequence[Union[str, tuple]] = [],
                          restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                         avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                          get_quartiles: bool = False,
                          get_nonzero_count: bool = False,
                          ) -> Union[pd.DataFrame, str]:
@@ -79,6 +82,8 @@ class BuildStockAggregate:
 
             restrict: The list of where condition to restrict the results to. It should be specified as a list of tuple.
                     Example: `[('state',['VA','AZ']), ("build_existing_model.lighting",['60% CFL']), ...]`
+            avoid: The inverse of restrict, specified in the same format. Rows that match any of the given
+                   conditions are excluded from the result.
             get_quartiles: If true, return the following quartiles in addition to the sum for each enduses:
                         [0, 0.02, .25, .5, .75, .98, 1]. The 0% quartile is the minimum and the 100% quartile
                         is the maximum.
@@ -109,6 +114,7 @@ class BuildStockAggregate:
                              join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                              weights: Sequence[Union[str, tuple]] = [],
                              restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                             avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                              split_enduses: bool = False,
                              collapse_ts: bool = False,
                              timestamp_grouping_func: Optional[str] = None,
@@ -125,6 +131,7 @@ class BuildStockAggregate:
                              join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                              weights: Sequence[Union[str, tuple]] = [],
                              restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                             avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                              split_enduses: bool = False,
                              collapse_ts: bool = False,
                              timestamp_grouping_func: Optional[str] = None,
@@ -143,6 +150,7 @@ class BuildStockAggregate:
                              join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = [],
                              weights: Sequence[Union[str, tuple]] = [],
                              restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
+                             avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = [],
                              split_enduses: bool = False,
                              collapse_ts: bool = False,
                              timestamp_grouping_func: Optional[str] = None,
diff --git a/buildstock_query/main.py b/buildstock_query/main.py
index 017061d..b24c49b 100644
--- a/buildstock_query/main.py
+++ b/buildstock_query/main.py
@@ -40,11 +40,12 @@ def __init__(self,
                  table_name: Union[str, tuple[str, Optional[str], Optional[str]]],
                  db_schema: Optional[str] = None,
                  buildstock_type: Literal['resstock', 'comstock'] = 'resstock',
-                 sample_weight: Optional[Union[int, float]] = None,
+                 sample_weight_override: Optional[Union[int, float]] = None,
                  region_name: str = 'us-west-2',
                  execution_history: Optional[str] = None,
                  skip_reports: bool = False,
                  athena_query_reuse: bool = True,
+                 **kwargs,
                  ) -> None:
         """A class to run Athena queries for BuildStock runs and download results as pandas DataFrame.
 
@@ -60,8 +61,8 @@ def __init__(self,
                 It is also different between the version in OEDI and default version from BuildStockBatch. This argument
                 controls the assumed schema. Allowed values are 'resstock_default', 'resstock_oedi', 'comstock_default'
                 and 'comstock_oedi'. Defaults to 'resstock_default' for resstock and 'comstock_default' for comstock.
-            sample_weight (str, optional): Specify a custom sample_weight. Otherwise, the default is 1 for ComStock and
-                uses sample_weight in the run for ResStock.
+            sample_weight_override (int or float, optional): Specify a custom sample_weight. Otherwise, the default is
+                1 for ComStock, and the sample_weight from the run is used for ResStock.
             region_name (str, optional): the AWS region where the database exists. Defaults to 'us-west-2'.
             execution_history (str, optional): A temporary file to record which execution is run by the user,
                 to help stop them. Will use .execution_history if not supplied. Generally, not required to supply a
@@ -71,6 +72,7 @@ def __init__(self,
             athena_query_reuse (bool, optional): When true, Athena will make use of its built-in 7 day query cache.
                 When false, it will not. Defaults to True. One use case to set this to False is when you have modified
                 the underlying s3 data or glue schema and want to make sure you are not using the cached results.
+            kwargs: Any additional keyword arguments supported by QueryCore can be supplied here.
         """
         db_schema = db_schema or f"{buildstock_type}_default"
         self.params = BSQParams(
@@ -79,7 +81,7 @@ def __init__(self,
             buildstock_type=buildstock_type,
             table_name=table_name,
             db_schema=db_schema,
-            sample_weight_override=sample_weight,
+            sample_weight_override=sample_weight_override,
             region_name=region_name,
             execution_history=execution_history,
             athena_query_reuse=athena_query_reuse
diff --git a/buildstock_query/query_core.py b/buildstock_query/query_core.py
index 49d7d15..ee285d1 100644
--- a/buildstock_query/query_core.py
+++ b/buildstock_query/query_core.py
@@ -972,7 +972,7 @@ def _simple_label(self, label: str):
         label = label.removeprefix(self.db_schema.column_prefix.output)
         return label
 
-    def _add_restrict(self, query, restrict, bs_only=False):
+    def _add_restrict(self, query, restrict, *, bs_only=False):
         if not restrict:
             return query
         where_clauses = []
@@ -988,6 +988,22 @@ def _add_restrict(self, query, restrict, bs_only=False):
         query = query.where(*where_clauses)
         return query
 
+    def _add_avoid(self, query, avoid, *, bs_only=False):
+        """Exclude rows matching any (column, value-or-values) pair in `avoid` (inverse of _add_restrict)."""
+        where_clauses = []
+        for col_str, criteria in avoid or []:
+            col = self._get_column(col_str, table_name=self.bs_table) if bs_only else self._get_column(col_str)
+            if isinstance(criteria, (list, tuple)):
+                if not criteria:
+                    continue  # an empty list avoids nothing; criteria[0] used to raise IndexError here
+                if len(criteria) > 1:
+                    where_clauses.append(col.not_in(criteria))  # col is already resolved, no second lookup
+                    continue
+                criteria = criteria[0]
+            where_clauses.append(col != criteria)
+        # where() ANDs its clauses, so a row is kept only when it matches none of the avoid conditions.
+        return query.where(*where_clauses) if where_clauses else query
+
     def _get_name(self, col):
         if isinstance(col, tuple):
             return col[1]
diff --git a/buildstock_query/schema/query_params.py b/buildstock_query/schema/query_params.py
index 3644656..a4f1d4e 100644
--- a/buildstock_query/schema/query_params.py
+++ b/buildstock_query/schema/query_params.py
@@ -11,6 +11,7 @@ class AnnualQuery(BaseModel):
     sort: bool = True
     join_list: Sequence[tuple[AnyTableType, AnyColType, AnyColType]] = Field(default_factory=list)
     restrict: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = Field(default_factory=list)
+    avoid: Sequence[tuple[AnyColType, Union[str, int, Sequence[Union[int, str]]]]] = Field(default_factory=list)
     weights: Sequence[Union[str, tuple, AnyColType]] = Field(default_factory=list)
     get_quartiles: bool = False
     get_nonzero_count: bool = False
diff --git a/buildstock_query/schema/run_params.py b/buildstock_query/schema/run_params.py
index aa49c8f..95fefca 100644
--- a/buildstock_query/schema/run_params.py
+++ b/buildstock_query/schema/run_params.py
@@ -8,7 +8,7 @@ class RunParams(BaseModel):
     db_name: str
     table_name: Union[str, tuple[str, Optional[str], Optional[str]]]
     buildstock_type: Literal['resstock', 'comstock'] = 'resstock'
-    db_schema: Optional[str] = 'resstock_raw'
+    db_schema: Optional[str] = None
     sample_weight_override: Optional[Union[int, float]] = None
     region_name: str = 'us-west-2'
     execution_history: Optional[str] = None
diff --git a/buildstock_query/schema/utilities.py b/buildstock_query/schema/utilities.py
index 381752d..b1860df 100644
--- a/buildstock_query/schema/utilities.py
+++ b/buildstock_query/schema/utilities.py
@@ -2,13 +2,13 @@
 from typing import Union, Any, Sequence
 from pydantic import BaseModel
 import sqlalchemy as sa
-from sqlalchemy.sql.elements import Label
+from sqlalchemy.sql.elements import Label, ColumnElement
 from sqlalchemy.sql.selectable import Subquery
 
 # from buildstock_query import BuildStockQuery  # can't import due to circular import
 
 
-SACol = sa.Column
+SACol = Union[sa.Column, ColumnElement]
 SALabel = Label
 DBColType = Union[SALabel,  SACol]
 DBTableType = sa.Table

From bf11859cf8f866794f3bb72c7ce1c86a1807696c Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 13:01:19 -0600
Subject: [PATCH 2/8] Utility query fixes

---
 buildstock_query/utility_query.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/buildstock_query/utility_query.py b/buildstock_query/utility_query.py
index db767ad..a2f68d6 100644
--- a/buildstock_query/utility_query.py
+++ b/buildstock_query/utility_query.py
@@ -165,14 +165,14 @@ def aggregate_ts_by_eiaid(self, params: UtilityTSQuery):
                                          params=params)
 
     @validate_arguments(config=dict(arbitrary_types_allowed=True, smart_union=True))
-    def aggregate_unit_counts_by_eiaid(self, *, eiaid_list: list[str],
+    def aggregate_unit_counts_by_eiaid(self, *, eiaid_list: Optional[list[str]] = None,
                                        group_by: list[Union[AnyColType, tuple[str, str]]] = [],
                                        get_query_only: bool = False):
         """
         Returns the counts of the number of dwelling units, grouping by eiaid and other additional group_by columns if
         provided.
         Args:
-            eiaid_list: The list of utility ids (EIAID) to aggregate for
+            eiaid_list: The list of utility ids (EIAID) to aggregate for. If not provided, all the eiaids will be used.
             group_by: Additional columns to group by
             mapping_version: Version of eiaid mapping to use. After the spatial refactor upgrade, version two
                              should be used
@@ -185,7 +185,7 @@ def aggregate_unit_counts_by_eiaid(self, *, eiaid_list: list[str],
         group_by = group_by or []
         eiaid_map_table_name, map_baseline_column, map_eiaid_column = self.get_eiaid_map()
         group_by = [] if group_by is None else group_by
-        restrict = [('eiaid', eiaid_list)]
+        restrict = [('eiaid', eiaid_list)] if eiaid_list else []
         eiaid_col = self._bsq._get_column("eiaid", eiaid_map_table_name)
         result = self._agg.aggregate_annual(enduses=[], group_by=[eiaid_col] + group_by,
                                             sort=True,

From 44cdac7632512e504c1ef8ceac0f1eece5acbe73 Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 13:01:54 -0600
Subject: [PATCH 3/8] Upgrades visualizer simplification

---
 .../upgrades_visualizer.py                    | 85 ++++++++++++-------
 .../tools/upgrades_visualizer/viz_data.py     | 56 ++++++++----
 2 files changed, 95 insertions(+), 46 deletions(-)

diff --git a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
index f3ff5ca..ab18f4f 100644
--- a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
+++ b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
@@ -35,8 +35,6 @@
 # ])
 transforms = [MultiplexerTransform()]
 
-# yaml_path = "/Users/radhikar/Documents/eulpda/EULP-data-analysis/notebooks/EUSS-project-file-example.yml"
-yaml_path = "/Users/radhikar/Documents/largee/resstock/project_national/fact_sheets_category_1.yml"
 opt_sat_path = "/Users/radhikar/Downloads/options_saturations.csv"
 default_end_use = "fuel_use_electricity_total_m_btu"
 
@@ -56,12 +54,40 @@ def filter_cols(all_columns, prefixes=[], suffixes=[]):
     return cols
 
 
-def _get_app(yaml_path: str, opt_sat_path: str, db_name: str = 'euss-tests',
+def get_int_set(input_str):
+    """
+        Parse a spec such as "1,2,3-6,8,9" into the set {1, 2, 3, 4, 5, 6, 8, 9}.
+        Dash ranges are inclusive; empty input gives an empty set; malformed input raises ValueError.
+    """
+    if not input_str:
+        return set()
+
+    pattern = r'^(\d+(-\d+)?,)*(\d+(-\d+)?)$'
+    if not re.match(pattern, input_str):
+        raise ValueError(f"{input_str} is not a valid pattern for list")
+
+    numbers = set()
+    for part in input_str.split(','):
+        first, _, last = part.partition('-')
+        # A bare number is treated as a one-element range.
+        lower = int(first)
+        upper = int(last) if last else lower
+        numbers.update(range(lower, upper + 1))
+
+    return numbers
+
+
+def _get_app(opt_sat_path: str, db_name: str = 'euss-tests',
              table_name: str = 'res_test_03_2018_10k_20220607',
              workgroup: str = 'largeee',
-             buildstock_type: str = 'resstock'):
-    viz_data = VizData(yaml_path=yaml_path, opt_sat_path=opt_sat_path, db_name=db_name,
-                       run=table_name, workgroup=workgroup, buildstock_type=buildstock_type)
+             buildstock_type: str = 'resstock',
+             include_monthly: bool = True,
+             upgrades_selection_str: str = ''):  # spec such as "1-3,5"; parsed by get_int_set below
+    viz_data = VizData(opt_sat_path=opt_sat_path, db_name=db_name,
+                       run=table_name, workgroup=workgroup, buildstock_type=buildstock_type,
+                       include_monthly=include_monthly,
+                       upgrades_selection=get_int_set(upgrades_selection_str)  # '' parses to an empty set
+                       )
     return get_app(viz_data)
 
 
@@ -93,7 +119,8 @@ def get_buildings(upgrade):
         return upgrade2res[int(upgrade)]['building_id'].to_list()
 
     def get_plot(end_use, value_type='mean', savings_type='', change_type='',
-                 sync_upgrade=None, filter_bldg=None, group_cols=None, report_upgrade=None):
+                 sync_upgrade=None, filter_bldg=None, group_cols=None, report_upgrade=None,
+                 resolution='annual'):
         filter_bldg = filter_bldg or []
         group_cols = group_cols or []
         sync_upgrade = sync_upgrade or 0
@@ -115,7 +142,7 @@ def get_plot(end_use, value_type='mean', savings_type='', change_type='',
         dbc.Row([dbc.Col(html.H1("Upgrades Visualizer"), width='auto'), dbc.Col(html.Sup("beta"))]),
         # Add a row for annual, vs monthly vs seasonal plot radio buttons
         dbc.Row([dbc.Col(dbc.Label("Resolution: "), width='auto'),
-                 dbc.Col(dcc.RadioItems(["annual", "monthly"], "annual",
+                 dbc.Col(dcc.RadioItems(["annual", "monthly"] if viz_data.include_monthly else ["annual"], "annual",
                                         inline=True, id="radio_resolution"))]),
 
         dbc.Row([dbc.Col(dbc.Label("Visualization Type: "), width='auto'),
@@ -278,7 +305,7 @@ def download_char(n_clicks, bldg_id, bldg_options, bldg_options2, chk_chars):
         bdf = viz_data.upgrade2res[0].filter(pl.col("building_id").is_in(set(bldg_ids))).select(char_cols)
         return dcc.send_bytes(bdf.write_csv, f"chars_{n_clicks}.csv")
 
-    def get_elligible_output_columns(category, fuel):
+    def get_elligible_output_columns(category, fuel, resolution):
         if category == 'energy':
             elligible_cols = viz_data.get_cleaned_up_end_use_cols(resolution, fuel)
         elif category == 'water':
@@ -304,15 +331,6 @@ def get_elligible_output_columns(category, fuel):
             raise ValueError(f"Invalid tab {category}")
         return elligible_cols
 
-    @app.callback(
-        Output('radio_resolution', 'options'),
-        Input('radio_resolution', 'value'),
-    )
-    def update_resolution(res):
-        nonlocal resolution
-        resolution = res
-        return ['annual', 'monthly']
-
     @app.callback(
         Output('dropdown_enduse', "options"),
         Output('dropdown_enduse', "value"),
@@ -322,7 +340,7 @@ def update_resolution(res):
         Input('radio_resolution', 'value')
     )
     def update_enduse_options(view_tab, fuel_type, current_enduse, resolution):
-        elligible_cols = get_elligible_output_columns(view_tab, fuel_type)
+        elligible_cols = get_elligible_output_columns(view_tab, fuel_type, resolution)
         enduse = current_enduse if current_enduse in elligible_cols else elligible_cols[0]
         return sorted(elligible_cols), enduse
 
@@ -772,11 +790,12 @@ def show_char_report(bldg_id, bldg_options, bldg_options2, inp_char: list[str],
         Input('input_building2', 'options'),
         Input('chk-graph', 'value'),
         State("uirevision", "data"),
-        State('report_upgrade', 'value')
+        State('report_upgrade', 'value'),
+        State('radio_resolution', 'value')
     )
     def update_figure(view_tab, grp_by, fuel, enduse, graph_type, savings_type, chng_type,
                       sync_upgrade, selected_bldg, bldg_options, bldg_options2, chk_graph, uirevision,
-                      report_upgrade):
+                      report_upgrade, resolution):
         nonlocal download_csv_df
         if dash.callback_context.triggered_id == 'input_building2' and "Graph" not in chk_graph:
             raise PreventUpdate()
@@ -798,7 +817,8 @@ def update_figure(view_tab, grp_by, fuel, enduse, graph_type, savings_type, chng
             filter_bldg = [int(b) for b in bldg_options]
 
         new_figure, report_df = get_plot(full_name, graph_type, savings_type,
-                                         chng_type, sync_upgrade, filter_bldg, grp_by, report_upgrade)
+                                         chng_type, sync_upgrade, filter_bldg, grp_by, report_upgrade,
+                                         resolution)
 
         uirevision = uirevision or "default"
         new_figure.update_layout(uirevision=uirevision)
@@ -813,8 +833,6 @@ def update_figure(view_tab, grp_by, fuel, enduse, graph_type, savings_type, chng
 def main():
     print("Welcome to Upgrades Visualizer.")
     defaults = load_script_defaults("project_info")
-    yaml_file = inquirer.text(message="Please enter path to the buildstock configuration yml file: ",
-                              default=defaults.get("yaml_file", "")).execute()
     opt_sat_file = inquirer.text(message="Please enter path to the options saturation csv file: ",
                                  default=defaults.get("opt_sat_file", "")).execute()
     workgroup = inquirer.text(message="Please Athena workgroup name: ",
@@ -827,16 +845,25 @@ def main():
                                "separated by comma if baseline and upgrades are in different run] :",
                                default=defaults.get("table_name", "")
                                ).execute()
-    defaults.update({"yaml_file": yaml_file, "opt_sat_file": opt_sat_file, "workgroup": workgroup,
-                     "db_name": db_name, "table_name": table_name})
+    monthly_default = defaults.get("include_monthly", True)
+    include_monthly = inquirer.confirm(f"Do you want to include monthly data ({monthly_default})?",
+                                       default=monthly_default,
+                                       ).execute()
+    upgrades_selection = inquirer.text(message="Please enter upgrade ids separated by comma and dashes (example: 1-3,5,7,8-9) "
+                                       "or leave empty to include all upgrades.",
+                                       default=defaults.get("upgrades_selection", "")).execute()
+    defaults.update({"opt_sat_file": opt_sat_file, "workgroup": workgroup,
+                     "db_name": db_name, "table_name": table_name, "include_monthly": include_monthly,
+                     "upgrades_selection": upgrades_selection})
     save_script_defaults("project_info", defaults)
     if ',' in table_name:
         table_name = table_name.split(',')
-    app = _get_app(yaml_path=yaml_file,
-                   opt_sat_path=opt_sat_file,
+    app = _get_app(opt_sat_path=opt_sat_file,
                    workgroup=workgroup,
                    db_name=db_name,
-                   table_name=table_name)
+                   table_name=table_name,
+                   include_monthly=include_monthly,
+                   upgrades_selection_str=upgrades_selection)
     app.run_server(debug=False, port=8005)
 
 
diff --git a/buildstock_query/tools/upgrades_visualizer/viz_data.py b/buildstock_query/tools/upgrades_visualizer/viz_data.py
index ea73cce..b000afb 100644
--- a/buildstock_query/tools/upgrades_visualizer/viz_data.py
+++ b/buildstock_query/tools/upgrades_visualizer/viz_data.py
@@ -3,6 +3,7 @@
 import polars as pl
 from buildstock_query.tools.upgrades_visualizer.plot_utils import PlotParams
 from typing import Union
+import datetime
 
 num2month = {1: "January", 2: "February", 3: "March", 4: "April",
              5: "May", 6: "June", 7: "July", 8: "August",
@@ -12,12 +13,14 @@
 
 class VizData:
     @validate_arguments(config=dict(arbitrary_types_allowed=True, smart_union=True))
-    def __init__(self, yaml_path: str, opt_sat_path: str,
+    def __init__(self, opt_sat_path: str,
                  db_name: str,
                  run: Union[str, tuple[str, str]],
                  workgroup: str = 'largeee',
                  buildstock_type: str = 'resstock',
-                 skip_init: bool = False):
+                 skip_init: bool = False,
+                 include_monthly: bool = True,
+                 upgrades_selection: set = set()):
         if isinstance(run, tuple):
             # Allows for separate baseline and upgrade runs
             # In this case, run[0] is the baseline run and run[1] is the upgrade run
@@ -39,24 +42,30 @@ def __init__(self, yaml_path: str, opt_sat_path: str,
                                         buildstock_type=buildstock_type,
                                         table_name=table,
                                         skip_reports=skip_init)
-        self.yaml_path = yaml_path
         self.opt_sat_path = opt_sat_path
+        self.upgrades_selection = upgrades_selection
+        self.include_monthly = include_monthly
         if not skip_init:
             self.initialize()
 
     def initialize(self):
-        self.ua = self.main_run.get_upgrades_analyzer(yaml_file=self.yaml_path,
-                                                      opt_sat_file=self.opt_sat_path)
+        """Resolve which upgrades to show, then load the success report, upgrade names and result tables."""
+        available_upgrades = [int(u) for u in self.main_run.get_available_upgrades()]
+        if (unavailable_upgrades := self.upgrades_selection - set(available_upgrades)):
+            raise ValueError(f"Upgrades {unavailable_upgrades} is not available in the run")
+        available_upgrades = self.upgrades_selection or available_upgrades  # empty selection means all upgrades
         self.report = pl.from_pandas(self.main_run.report.get_success_report(), include_index=True)
-        self.available_upgrades = list(sorted(set(self.report["upgrade"].unique()) - {0}))
-        self.upgrade2name = {indx+1: f"Upgrade {indx+1}: {upgrade['upgrade_name']}" for indx,
-                             upgrade in enumerate(self.ua.cfg.get('upgrades', []))}
-        self.upgrade2name[0] = "Upgrade 0: Baseline"
-        self.upgrade2shortname = {indx+1: f"Upgrade {indx+1}" for indx,
-                                  upgrade in enumerate(self.ua.cfg.get('upgrades', []))}
+        self.available_upgrades = sorted({int(u) for u in available_upgrades} - {0})  # baseline (0) is kept apart
+        self.upgrade2name = {0: "Upgrade 0: Baseline"}
+        if self.available_upgrades:
+            upgrade_names = self.main_run.get_upgrade_names()
+            self.upgrade2name |= upgrade_names
+        # Key the short labels by real upgrade id so a sparse selection such as {5, 7} still resolves.
+        self.upgrade2shortname = {upgrade: f"Upgrade {upgrade}" for upgrade in [0, *self.available_upgrades]}
         self.chng2bldg = self.get_change2bldgs()
         self.init_annual_results()
-        self.init_monthly_results(self.metadata_df)
+        if self.include_monthly:
+            self.init_monthly_results(self.metadata_df)
         self.all_upgrade_plotting_df = None
 
     def run_obj(self, upgrade: int) -> BuildStockQuery:
@@ -122,10 +131,23 @@ def init_monthly_results(self, metadata_df):
             ts_cols = self._get_ts_enduse_cols(upgrade)
             print(f"Getting monthly results for {upgrade}")
             run_obj = self.run_obj(upgrade)
-            monthly_vals = run_obj.agg.aggregate_timeseries(enduses=ts_cols,
-                                                            group_by=[run_obj.bs_bldgid_column],
-                                                            upgrade_id=upgrade,
-                                                            timestamp_grouping_func='month')
+            monthly_vals_query = run_obj.agg.aggregate_timeseries(get_query_only=True,
+                                                                  enduses=ts_cols,
+                                                                  group_by=[run_obj.bs_bldgid_column],
+                                                                  upgrade_id=upgrade,
+                                                                  timestamp_grouping_func='month',
+                                                                  )
+            month_year = f"{datetime.datetime.now().strftime('%b%Y')}"
+            s3_unload_path = f"s3://resstock-core/athena_unload_results/{month_year}/"
+            if monthly_vals_query in run_obj._query_cache:
+                monthly_vals = run_obj._query_cache[monthly_vals_query].copy()
+            else:
+                pd_cursor = run_obj._conn.cursor(unload=True, s3_staging_dir=s3_unload_path).execute(
+                    monthly_vals_query,
+                    result_reuse_enable=True,
+                    result_reuse_minutes=60 * 24 * 7)
+                monthly_vals = pd_cursor.as_pandas()
+                run_obj._query_cache[monthly_vals_query] = monthly_vals
             run_obj.save_cache()
             monthly_df = pl.from_pandas(monthly_vals, include_index=True)
             monthly_df = monthly_df.with_columns(pl.col('time').dt.month().alias("month"))
@@ -193,7 +215,7 @@ def get_plotting_df(self, upgrade: int,
                 .then(0)
                 .otherwise(pl.col("value"))
                 .alias("value")
-                )
+            )
         return up_df
 
     def get_all_cols(self, resolution: str) -> list[str]:

From d16242dc593073b0b2892adddb15812100c23fc4 Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 13:05:49 -0600
Subject: [PATCH 4/8] Style fixes

---
 .../tools/upgrades_visualizer/upgrades_visualizer.py         | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
index ab18f4f..c489429 100644
--- a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
+++ b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
@@ -96,7 +96,6 @@ def get_app(viz_data: VizData):
     upgrade2res = viz_data.upgrade2res
     # upgrade2res_monthly = viz_data.upgrade2res_monthly
     upgrade2name = viz_data.upgrade2name
-    resolution = 'annual'
     all_cols = viz_data.upgrade2res[0].columns
     emissions_cols = filter_cols(all_cols, suffixes=['_lb'])
     # end_use_cols = filter_cols(all_cols, ["end_use_", "energy_use__", "fuel_use_"])
@@ -849,8 +848,8 @@ def main():
     include_monthly = inquirer.confirm(f"Do you want to include monthly data ({monthly_default})?",
                                        default=monthly_default,
                                        ).execute()
-    upgrades_selection = inquirer.text(message="Please enter upgrade ids separated by comma and dashes (example: 1-3,5,7,8-9) "
-                                       "or leave empty to include all upgrades.",
+    upgrades_selection = inquirer.text(message="Please enter upgrade ids separated by comma and dashes "
+                                       " (example: 1-3,5,7,8-9) or leave empty to include all upgrades.",
                                        default=defaults.get("upgrades_selection", "")).execute()
     defaults.update({"opt_sat_file": opt_sat_file, "workgroup": workgroup,
                      "db_name": db_name, "table_name": table_name, "include_monthly": include_monthly,

From cf07677784b5f5447ed7fd99767356504b8fecbd Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 13:25:44 -0600
Subject: [PATCH 5/8] Update test

---
 tests/test_BuildStockQuery.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_BuildStockQuery.py b/tests/test_BuildStockQuery.py
index b051385..6231c26 100644
--- a/tests/test_BuildStockQuery.py
+++ b/tests/test_BuildStockQuery.py
@@ -247,7 +247,7 @@ def test_aggregate_annual(temp_history_file):
         db_name='buildstock_testing',
         buildstock_type='resstock',
         table_name='res_n250_hrly_v1',
-        sample_weight=29.1,
+        sample_weight_override=29.1,
         execution_history=temp_history_file,
         skip_reports=True
     )
@@ -390,7 +390,7 @@ def test_aggregate_ts(temp_history_file):
         buildstock_type='resstock',
         table_name='res_n250_hrly_v1',
         execution_history=temp_history_file,
-        sample_weight=29.1,
+        sample_weight_override=29.1,
         skip_reports=True
     )
     my_athena2.get_available_upgrades = lambda: ['0']

From e72a6b9741a6828df3741c5785e6a8d9fd7b306e Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 14:48:50 -0600
Subject: [PATCH 6/8] Update reference files

---
 ...17d2f98a99ed74388852ac9b8f_query_cache.pkl | Bin 2191086 -> 2191940 bytes
 ...all_run_baseline_20230810_100_baseline.pkl | Bin 509209 -> 509228 bytes
 ...l_run_baseline_20230810_100_timeseries.pkl | Bin 281083 -> 281083 bytes
 ...all_run_category_1_20230616_timeseries.pkl | Bin 497674 -> 497693 bytes
 ...small_run_category_1_20230616_upgrades.pkl | Bin 509476 -> 509492 bytes
 5 files changed, 0 insertions(+), 0 deletions(-)

diff --git a/tests/reference_files/c2e8c98cee7aca046d23eaea93afcb1393eda217d2f98a99ed74388852ac9b8f_query_cache.pkl b/tests/reference_files/c2e8c98cee7aca046d23eaea93afcb1393eda217d2f98a99ed74388852ac9b8f_query_cache.pkl
index 418d92c3b8fba0490e39f054c8db868e983d4b28..e447ad330f03ed4be903e557a48de1790b485c6f 100644
GIT binary patch
delta 577
zcmZ`#OD_Xa6gI<9Iz_$fQ5Or-Xqt$X1tLvKNR?PvNpowicBJ#j?VZIeD9Ncr*v-iN
z50Ti4_yb}o7Q({H53n-R6h)lPJ?DF!-1GKW;cj0l+#ztlLnAbS0L{<>0ceFb2!aS9
zXon8ygfMhLH}pU+^g%xiKm-P12!>$<qA&{RatssxLA<(t7Pnj7Yi%rEKD%#2b+t)~
zWQU<0Tw;=G<SCX3!X>0=jN}Q8`F#zJBTRD&qnKLKI5v!;m8~&}+MCs|O2+FwRpiIM
zrd_J5_C{cG>Ia;sx@n-Cg{F~CWkRd%m%?5=o#F)dW{sCP>HLnD+}8tcz(d3gKbc4h
z4SqSy$rV!jP9aiQi5)p!;|<bTP%~A-%F4_#h_m-Dx;VqnmW5-dAfIe|e1D2~`*0DZ
z6-`l16)h9Y6fN)kWs<sHtTGe-co5cP^rag4t=huO`<b6VSB;tZEvT)Ie`a_m_X59d
dzKbx&ewtqjiS<Xfxr?ZsUI@FZ>wJ_q6CaS5!W94j

delta 94
zcmX@|q?PgA-B!ki7RDB)7UmX~7S<NF7WNj77S0x~7VZ|F7Ty-V7XB827Qq&w7U33=
y7SR^57V#E|7ReT=7U>q57TFfL7Wo#1EsBY$Os$;T4?O0H<(z&XPf>@dR1X01rXM~4

diff --git a/tests/reference_files/small_run_baseline_20230810_100_baseline.pkl b/tests/reference_files/small_run_baseline_20230810_100_baseline.pkl
index 9df5da78f4eb803a199f1c92711f6c3aa266d0f9..8c430b4fb7752cc0ac70fcec6522ef95f2f1886b 100644
GIT binary patch
delta 1591
zcmaKsTWkzr6vsRJot?eeHcj1Hnr4Hw8f|q^T_RO+4Jr{{1Y=t()3M!cw{2V#4;rmz
zBPpvNq0*3$u&QzCajnIJdyshGfgtfFf(TF4H?#B2Y^CuqJ7>>1|KE4MlR4*DXHl}V
zsQ(EB98yb@6b{yg!iji}6p2Qpp!%bG+|t%qv_Xp2DxtcT=0w~nHO8Vlc1qhqI}iVa
zN#o_Zu7n)kn2<?Oj&#V|<U+ZDJ<8=Os{}qhQ16o!7HW{gazqnonJMN-u|O;ypwE93
z-{mik*ePpR<?Rb4+e1kKLrF{aI;ZB+j-c-s5f9xg5(l0Y$YCL!ja7vFv}C4zh>9L$
zX}v<Gw+Tow{X|6{Zm^Tsu+WP&qKEb$6HCzRWT7;dGHw|@b&;cj!>EDI=n>cAUH6E9
zT;fDIhm6~rd2IiX#Y1ZZ+f;nnYOrzHc2e4**S~v+^by@ICGbo?f4~Zl`4yjw@RZxV
zc6g}U-By@NAJ}0u4HGE9droN8BXsW~$fxV`ARFsO!4a<g?S?^ar*hy9&wex(ym&4b
z4)I`h9^BXM?&>tjjb&p@5>s5uRMVkCu;Z2S(8;|F;nln}aN6R+Jq1PxT@&FEKj}>&
zyy6m8l9!(FFwpxV=;B_-OjaE8Qtn7C<P~k21PKoMH5u-4d(aChp3VGac*zI+d!eSh
zvDlDj+;X~cOQVZ!+Fu4%{83_7Wl~s(7hzJO<pu@W1#a_dOxd?th73C^V1U=YxYFz_
zYe+s$m<wn0Ame-S^E?y1e?A}=F06v<x;;=0H@Tagc!S&QtGLDO1xw%px4$nnF@4M7
zD)-APj9PHYD##Iv!)$ERQ_QAYsaTqom7aX%^UAC&xgq^hr+OCswiXKM#y`Y``)eRq
zC^rQoZUn`-N+W15l`tcN@O3rBvo%6H%L>XP6JDnY+Dj$ONfRD#f(`bH%F3AmzrUQ8
zN-%razx?(#3D{%BHc9L#*C#QzOXOpQ?+%GW7Pr0x6s-cPE*W(fm13Y<Y!&{As>=r1
zvgy$~N&lP_ry*N0r?`VL{giDNFJ3&(^!lmOdc+spW|Cx3*mdN*t@R(ex>Jzt6pt_}
zvnaZ9JMrTMi;W&AQJek0R()*OnytMQY>L}te_q_RCDdFOt8Z+nk46&8LDo%tGiZAY
LLKyMBtycI86aqq=

delta 1571
zcmaKsO-vI}5XafR>GlH(A%3C~(x9cHd?SL!AO=MvXkzeUgtd_B+CnQ;qDB)B5<t=m
zT6y4Cj3%0BLE;DFCssWuh*1*{deEq6V$>KtDZbtA+pWfU*uL5S%>3TG*PV&>WDWFW
z4L^lNc4=2AxNpDY_wJ8`ZPK1Lsm0UeZHdUu;WQ}_3`id3N7asjIolO>NZUifRw>xz
z^EU6<9qEn8frf}oJaTKd+#+YnKKA&pRhlJmYmS|6Ci>-O=5Cb(EJ2NoF)_yEP`H9V
z|4H1}KG{O&%!)g3*c<KgMg{anO{tshs-$i~-&YeS-6j$nUKGeNAs&sDgnTz8hJ6T%
zPGn(cg+#RtNG_II$%#MI7n?*U9Uc(#&}Anf4M`cY04I`3zhKk1r-i4*dVJtuQHj_%
zAf4DzP9w9nC%T5GOisE%u;k#&cAbrD_mcc>t@Hy^WQb^XK7nW2{v&1>=cjuv!UVU^
zTH%Ri_n9GwKDNSi+CpFsKD0x-=AnnGA%kw22C3Mb0>^poPX~;0JC+9bdGy#!aN(tN
zILe(>)8LV2_f^G74lI~qkXXje#B4g130Ay58+y3P5H3}v73WRKcyNyH!sK}{#&>#?
z39onxE6GJqIT`4E7W8t}R>F#7D&<0K6|bl<8zLO^V?I3O_NWVDJeuhRc-0O3Q=vxs
zu3SAm;gpN@Q|h<qpu+`V#&3B>RR)E*co7CASfo>s9pE0X#z^~8s;6O38I17SSC<<%
z%Pu4X=PrW_nv?NeIJw+Fcdh{BiK{B%mS&Gs!5uEM9dC1+eHC}Py>bl<a{FtIff-r{
zH@GgZ*K5HAb&w|H8V$@E+gDbTloW4z-(+o4lI)8wN<){@FZGZ~8-9^w?A!q9LXna1
z&tc%R*Qo?`Q3!<zgwGoxoT?JKSd>TpH{o@hpe_nwX`C?L2wSa7OUf%s3Jc3<z64AD
zc+2SOkbpgA?2yFnBCQkCdqv)6`0l7UWpZdkz^7I~mHDEKp?s|96WfKqyvm%RY|gmR
z(a*ebCjE6rT!?JWoZ|um7gIK3TzKWA9)=4~i!b;;z*3?fVaM^ymiE84PzDRK!QvEB
u5-X#%dr2`4nk@84o^s>=yRVO3>W!<5AKStfxfmx$EpI{a<M<;>lkgk#3OP~$

diff --git a/tests/reference_files/small_run_baseline_20230810_100_timeseries.pkl b/tests/reference_files/small_run_baseline_20230810_100_timeseries.pkl
index a420564cd541c087dab81bd648bb6e3d74f80075..c02d4a2966791eb14013ad9942765e227e56e3ae 100644
GIT binary patch
delta 199
zcmex8S@8E{!42*n+MMwvh4DFwNvSzgdidk>^7G;oK?Fo3Bcq2azMv?-qB1@^wQ_Qi
zhl*O_#3>mWu~Rab6SI8T7#KRTyn$qv5s2`Cv%EI%@z}?xnvnrkGjR&C(g?UxFw1N6
hd@nIB>`FP<VWxsvUd^{c+HZw00x{F}TOrJfUjbZgJC^_e

delta 199
zcmex8S@8E{!42*n+FbDkMfnw#@!6@BQ+hb#OA6z25|dJMreq}c@W<!n=fx+22(Z}X
zA`ca{jEPe+GGeD>FehgDvN14pWcdKeEF%!%1!sA0-s7>4Q5CEr1E>R8X#`v;nB~2B
hzLyvmcBLHbFjK)S@8(+}?YBZ0ftYFgtq^9#uK-=gJC^_e

diff --git a/tests/reference_files/small_run_category_1_20230616_timeseries.pkl b/tests/reference_files/small_run_category_1_20230616_timeseries.pkl
index 75e0621db77ef1dabe4307327442b7f86ffe1cbd..8e3150eeec01b46d9de63cf8ffc209acff3dc1fe 100644
GIT binary patch
delta 477
zcmeC$AUAh|+=h#8+MMwvh4DFwNvSzgdidk>^7G;oK?Fo3Bcq2azMv?-qB1@^wQ}+w
zHx;$SiBmE%Vy9#<CuZrgF)(ywX#>eDArPShXK8JAbKl3P0~X2104vM@YDCsy0oMU$
zX>B&}6lF8bfEWTY8KePZQ&t_2gJM}XTq~HRwYkdQkp-`1Z{a$?EUo6}!R^n38G)E-
z`}1IC;~!@DoO<0C<~cA+3uKrfkmxa=esL<h?DSk8mKY8*3kzdQBO}A<7kyYvQFxN=
z>b@*M%(`9Omo0xYbNzINsf8?}Ti3C-#^H7K!*-axV3yYQ_;~hQBjFzIl+@znqRfJl
b%>2A5S-n8lZ9g-S{VEG%&h|yq*fSUbLEnUb

delta 457
zcmbQcL9T0q+=h#8+FbDkMfnw#@!6@BQ+hb#OA6z25|dJMreq}c@W<!n=fx+22(Z}X
zKW-{&855^uWW-L%U{1`^Wn*CI$kG9lSwbK}3(nHs?B>3YQ70o2A`4QO0n~`B!vd}Y
z%+lU$;3>*xilzZ%Q&t^NC5mO;aIIjL_U0;oM;5%6y@l%lv$UI^2e&^DW&~oU?azam
zjenTobLw?pnCHMOZIEGxK%&Qddf-%c+3C4HEHNDB#uk>w1_ox+FZ!^UqVOc!)qPoj
zn033lFI)a*=A7vaQwv!{x2|Jvjl=8ehwU(X!7T0V@$u}rM%(XCWWUP7n7w`LH1-Te
E00EJF<p2Nx

diff --git a/tests/reference_files/small_run_category_1_20230616_upgrades.pkl b/tests/reference_files/small_run_category_1_20230616_upgrades.pkl
index 5739188a75f6765199bdddc63848c9e24aabc2f8..8d8aaeb16e2f43ad2af84d40ebfb0282064ab9df 100644
GIT binary patch
delta 2421
zcmZXWUu;ul6u{Se%l+1ZEILZrw1e0O7b%thu1puPJP@KLh>3}Uwd*Q(TSvQYm`yZh
z*8Pd8gV~aAn4w}f!RhGMwLKFam}{a4@_>XFjYd<S_Mjm~pQiEaJuTe!JT$jCzu$Mx
z`TpE~os4cwM>o#SFtf?i+wBQ>Tm6C9O}1{W*%Jx}`}#ed{{Fa{jQ!3Yekf}81-nAt
zu(vlDj*rFF%!oR##?-X<q+-_U7Y*51usTq^yQyi1Yy0+XF`KC_wo+YpHxRLzhHWMT
z*i6!j<NmCArNjA1Rn=hp`M5gQsAl2O-O`dli@#D9|Mzj}A4!X!E{hwRrEk#Bl*NB~
zLi!HlxAk$}vQKjGt<91NmRqD#X#8Dfh)TO)@hRy8!-IwPERDMM)TEel@<?2j`C_N?
z0(||n6u=z2^csjN*F0LcOONS>L*1m*g#OQE@zyEn;7EN^&8XSpns!{<Q&pv=@sZ*;
zw#Y6+7MN2$>)cal%i4S|Z%S-IQfvW^7VUMI1odir)3IKB6?wEr3Vt~(Z!$KN73xDl
zd!*E_qAtGeWx0{>^U51U#UoxhlF(+du>W4g?C>3<QG8ax9iwvaC5;~r>o^zO0;)%u
z$LYRFAYX1*?A+s$)<DRsT*kefr`q~vX+NB4Q-YZ27BRs2nsN!@UlguYl`O*A9@3v^
zVFBR|3a@r5mk}N!kc+hS{Ml~B3^%%zDZjP=dry!8<F}Mq%;BZ**loqQ*>EY-!~8xi
zLH#@W1Op??0{{8gDOrO)3e!hfvHb{v+#X~bV7i^1#rg?iKvyRNggFWibg|;r<tY@o
zGdNO?RJP26F=hozH!Hqec4ENwF#8;by9wkgA2T!WkFon;u9wA7^HFW$Em39QbrwY<
zLJj}h!Z^^!I2s9Re1A@qni&(N8s1<hQOi+HE46&0R4Pvl5Jm!r%kNgM2Z%l{BD7QJ
z8enOJZVGE7><U63fx30787!?+glKSeh+V)O2|WaHx{5DNP9NumQ^!}0vQ04X9(x~0
z=7|A2qwEWW@*tV97(Rp0UI`uW=Sen-&|L{Fys#r6c4Pt#A2C3juJZ^ZmCyl)PM2~g
zDk0`B?l!->+f)+^W`*T(HilL5m4*WrJ}gy{hsfLm6YLz0v=hk1IWfbNAF(rNxQPMc
z^iL!7Q7BgDGlUTe#}n*Rgb4~?onn&+a|9L^-3oipm)0b&H{iDmrE?+=S5CI@s+-~Z
zbm=$7P7E0Rl8s|wH-*n!EVb;TaNR8Xq&Qg$f1E45a0vqWx0_`fUz}$@v=lDNoKBz@
z<r?whR=g;egeWdb?NPV~ck-KC<OcX7&76kv8}nB*wMW6+s+nAvt80#jj)uK${`hl4
hg}*de2xnQcrZ&2|&EMk-w}*P$gU90P1IJsP{{xdR&N2W1

delta 2420
zcmZXWUu;ul6u{Se%l+1hE(A;2Ob4+KE>h~ufKjH4SRM#b6U4+s!P=F|rR&zM46}*G
z%(_1@bue4<4Kq~iCO94Y)7zaX56m@D1bI-xgBp#dZ+p-XqfgWL-Fw<`+w;)f<@|o%
zIp_Ox`&CPBnMiJ#oo3DUKvz80+ZSjL_ob7zKu>od8f*(k(@A?M*3lJ=2YX`ibh0MU
z8S4xL^*@MHKe7ims57H!bzxY|sVQ|{e6lHL_45`j6|0U`H#hC}H8nQwO1W&csnzP*
zwLrpU8*<q!;Ic`po(-CMHR64!s%jwpY+9XbP&IgXm$Ym#;xCoO|8183k&O7+vbeQH
z`WpRQS^Ve6q;D~P+Z^Yu`y>x<Y>{lR(kh)n<L@#<RN4tkPe|`s9?;u!G?>~mraW^b
zt;&3<U3m_^dQysFj-6%=M3w6Squb?2Ov9meLfVb~FJ<wzN$KElT~1wCThqw(Jylie
zJU+7g=62a<(SUj7^WHsrTh5lddFR!vs)=pD(W1SGP0*mRH<3-^Uy;XnWZ~Dt@>Xko
zN!2$m(u;!e$f{o?ef-fE<p#blC~p=Oj|AmJ#+b?C{<{^mp*vQq_^g9FR^{Le20t7(
zaW1$6)PR!3>Ap@NUpcP0dB7*FhpwP<1@|^fwM{M3emHkjiD9B!!~pLr%9jZLqVPUd
zSwOh)1nEz-u!yjU!fWly6@-Tf<RWbyf4W<-!_5w5GHfis-czK&*ezuia|9{uyscQb
zS*CI)SU6-PsC&ztpnsS-;J*+%BO5S8p>~WF+fNY4-7&TqrjE1oSU*Dy=xAqvFi+uu
z4p!W{0)--X4oAv~%9eR7#hl>iX2qAwO$@jZXP@G5KY@JpLuTiFDRwW+^{^CbA*zkP
zA*%Gh%93a#s1bfs7zcV8M<YXx?=FZ^)1#tP{cG$rYI&*|rB+UrN)?C!!pPuo`R&T}
z0MW-~gl-Cb{Y*pXr*LC}T}2oo(6ml91EqCJ5Dl&kvP+mFV}>A3SMjCEo8w$Rb$s0j
z+Y0^fuy=7}ff%qO$v#6U50Dv);nN7+mCyr!o@OHm{gu$c^&J7RBjad<hymhsT|}6u
zgdR9_wv;<l2{CtZxB1#`Q%x+G6IRC9C{`&{8Xj1Dzf?sYBy*3BvkN%VO&}NN#14;t
zz|NuJCkBYqKZP(vp;(<y5GE)b%dn3TW+;4ll1(7Y6R0n`6ZT##tx3Ub!0(qz=R_W=
zoUHz;+u_Dk={v?v3>f*GjbULwg-=~BwH%`G{#o`>ak3QtG*^1zG6eE(w#hEOlx07(
z>KA3+B+!d;z4&q~UX;s16c?rO(C@(={QK>4J^Z0DuciFP{0&Xxp_`3{$%T1O&B?A~
Y@!-*L`k6ufCyfU21vXP7pKSB~580p1tN;K2


From 97e587ebff46bf830e34aa53b300c7779efceeea Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 14:51:33 -0600
Subject: [PATCH 7/8] Update test files

---
 buildstock_query/tools/upgrades_visualizer/viz_data.py | 6 ++++--
 tests/generate_reference_viz_data_files.py             | 2 --
 tests/test_Viz.py                                      | 2 --
 3 files changed, 4 insertions(+), 6 deletions(-)

diff --git a/buildstock_query/tools/upgrades_visualizer/viz_data.py b/buildstock_query/tools/upgrades_visualizer/viz_data.py
index b000afb..76a1b1a 100644
--- a/buildstock_query/tools/upgrades_visualizer/viz_data.py
+++ b/buildstock_query/tools/upgrades_visualizer/viz_data.py
@@ -51,6 +51,8 @@ def __init__(self, opt_sat_path: str,
     def initialize(self):
         available_upgrades = self.main_run.get_available_upgrades()
         available_upgrades = [int(u) for u in available_upgrades]
+        if not self.upgrades_selection:
+            self.upgrades_selection = set(available_upgrades)
         if (unavailable_upgrades := self.upgrades_selection - set(available_upgrades)):
             raise ValueError(f"Upgrades {unavailable_upgrades} is not available in the run")
         available_upgrades = self.upgrades_selection
@@ -137,11 +139,11 @@ def init_monthly_results(self, metadata_df):
                                                                   upgrade_id=upgrade,
                                                                   timestamp_grouping_func='month',
                                                                   )
-            month_year = f"{datetime.datetime.now().strftime('%b%Y')}"
-            s3_unload_path = f"s3://resstock-core/athena_unload_results/{month_year}/"
             if monthly_vals_query in run_obj._query_cache:
                 monthly_vals = run_obj._query_cache[monthly_vals_query].copy()
             else:
+                month_year = f"{datetime.datetime.now().strftime('%b%Y')}"
+                s3_unload_path = f"s3://resstock-core/athena_unload_results/{month_year}/"
                 pd_cursor = run_obj._conn.cursor(unload=True, s3_staging_dir=s3_unload_path).execute(
                     monthly_vals_query,
                     result_reuse_enable=True,
diff --git a/tests/generate_reference_viz_data_files.py b/tests/generate_reference_viz_data_files.py
index fd74591..52b671c 100644
--- a/tests/generate_reference_viz_data_files.py
+++ b/tests/generate_reference_viz_data_files.py
@@ -18,10 +18,8 @@ def save_bsq_obj(bsq_obj: BuildStockQuery, cache_name=None):
 
 def save_viz_data_reference_data():
     folder_path = pathlib.Path(__file__).parent.resolve()
-    yaml_path = str(folder_path / "reference_files" / "example_category_1.yml")
     opt_sat_path = str(folder_path / "reference_files" / "options_saturations.csv")
     viz_data = VizData(
-        yaml_path=yaml_path,
         opt_sat_path=opt_sat_path,
         workgroup='largeee',
         db_name='largeee_test_runs',
diff --git a/tests/test_Viz.py b/tests/test_Viz.py
index 93d7d24..e040278 100644
--- a/tests/test_Viz.py
+++ b/tests/test_Viz.py
@@ -20,10 +20,8 @@ class TestViz:
     @pytest.fixture(scope='class')
     def viz_data(self):
         folder_path = pathlib.Path(__file__).parent.resolve()
-        yaml_path = str(folder_path / "reference_files" / "example_category_1.yml")
         opt_sat_path = str(folder_path / "reference_files" / "options_saturations.csv")
         mydata = VizData(
-            yaml_path=yaml_path,
             opt_sat_path=opt_sat_path,
             workgroup='largeee',
             db_name='largeee_test_runs',

From 6c3056adbb74fc0e92724454282f082586f9ec5e Mon Sep 17 00:00:00 2001
From: Rajendra Adhikari <rajendraadhikari.ee@gmail.com>
Date: Thu, 1 Feb 2024 15:10:16 -0600
Subject: [PATCH 8/8] Prompt formatting fixes

---
 .../upgrades_visualizer/upgrades_visualizer.py    | 15 ++++++++-------
 1 file changed, 8 insertions(+), 7 deletions(-)

diff --git a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
index c489429..564b259 100644
--- a/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
+++ b/buildstock_query/tools/upgrades_visualizer/upgrades_visualizer.py
@@ -832,24 +832,25 @@ def update_figure(view_tab, grp_by, fuel, enduse, graph_type, savings_type, chng
 def main():
     print("Welcome to Upgrades Visualizer.")
     defaults = load_script_defaults("project_info")
-    opt_sat_file = inquirer.text(message="Please enter path to the options saturation csv file: ",
+    opt_sat_file = inquirer.text(message="Please enter path to the options saturation csv file:",
                                  default=defaults.get("opt_sat_file", "")).execute()
-    workgroup = inquirer.text(message="Please Athena workgroup name: ",
+    workgroup = inquirer.text(message="Please enter Athena workgroup name:",
                               default=defaults.get("workgroup", "")).execute()
-    db_name = inquirer.text(message="Please enter database_name "
-                            "(found in postprocessing:aws:athena in the buildstock configuration file): ",
+    db_name = inquirer.text(message="Please enter database name "
+                            "(found in postprocessing:aws:athena in the buildstock configuration file):",
                             default=defaults.get("db_name", "")).execute()
     table_name = inquirer.text(message="Please enter table name (same as output folder name; found under "
                                "output_directory in the buildstock configuration file). [Enter two names "
-                               "separated by comma if baseline and upgrades are in different run] :",
+                               "separated by comma if baseline and upgrades are in different run]:",
                                default=defaults.get("table_name", "")
                                ).execute()
     monthly_default = defaults.get("include_monthly", True)
-    include_monthly = inquirer.confirm(f"Do you want to include monthly data ({monthly_default})?",
+    default_str = "Yes" if monthly_default else "No"
+    include_monthly = inquirer.confirm(f"Do you want to include monthly plots ({default_str})?",
                                        default=monthly_default,
                                        ).execute()
     upgrades_selection = inquirer.text(message="Please enter upgrade ids separated by comma and dashes "
-                                       " (example: 1-3,5,7,8-9) or leave empty to include all upgrades.",
+                                       "(example: `1-3,5,7,8-9`) or leave empty to include all upgrades.",
                                        default=defaults.get("upgrades_selection", "")).execute()
     defaults.update({"opt_sat_file": opt_sat_file, "workgroup": workgroup,
                      "db_name": db_name, "table_name": table_name, "include_monthly": include_monthly,