In compare_results.py, set the absolute threshold based on reporting units; refactor some methods; improve documentation.

aspeake · aspeake · commit 529c8dad7ffd · 2025-03-17T12:14:49.000-06:00
diff --git a/.github/workflows/integration_tests.yml b/.github/workflows/integration_tests.yml
@@ -55,7 +55,7 @@ jobs:
       - name: Install Python dependencies
         run: |
           python -m pip install --upgrade pip
-          pip install . psrecord
+          pip install ".[dev]" psrecord
       - name: Run and profile workflow
         env:
           branch_ref: ${{ steps.branch_ref.outputs.branch_ref }}
@@ -70,19 +70,17 @@ jobs:
           else
             python tests/integration_testing/run_workflow.py --yaml tests/integration_testing/integration_test.yml
           fi
-          rm -rf ./tests/integration_testing/results/*
           mv ./results/* ./tests/integration_testing/results/
       - name: Compare integration test results
         run: |
-          #FIXME temporarily pull from ci_outputs
-          git fetch origin master ci_outputs
+          git fetch origin master
           branch_name="${{ github.ref }}"
           if [[ $(git diff --exit-code origin/master ./tests/integration_testing/results/agg_results.json ./tests/integration_testing/results/ecm_results.json) ]]; then
             mkdir tests/integration_testing/base_results
-            git show origin/ci_outputs:tests/integration_testing/results/agg_results.json > tests/integration_testing/base_results/agg_results.json
-            git show origin/ci_outputs:tests/integration_testing/results/ecm_results.json > tests/integration_testing/base_results/ecm_results.json
-            git show origin/ci_outputs:tests/integration_testing/results/plots/tech_potential/Summary_Data-TP.xlsx > tests/integration_testing/base_results/Summary_Data-TP.xlsx
-            git show origin/ci_outputs:tests/integration_testing/results/plots/max_adopt_potential/Summary_Data-MAP.xlsx > tests/integration_testing/base_results/Summary_Data-MAP.xlsx
+            git show origin/master:tests/integration_testing/results/agg_results.json > tests/integration_testing/base_results/agg_results.json
+            git show origin/master:tests/integration_testing/results/ecm_results.json > tests/integration_testing/base_results/ecm_results.json
+            git show origin/master:tests/integration_testing/results/plots/tech_potential/Summary_Data-TP.xlsx > tests/integration_testing/base_results/Summary_Data-TP.xlsx
+            git show origin/master:tests/integration_testing/results/plots/max_adopt_potential/Summary_Data-MAP.xlsx > tests/integration_testing/base_results/Summary_Data-MAP.xlsx
 
             python tests/integration_testing/compare_results.py --base-dir tests/integration_testing/base_results --new-dir tests/integration_testing/results
           fi
@@ -98,7 +96,7 @@ jobs:
           git pull origin $branch_ref
           git add ./tests/integration_testing/results/*.json
           if [[ $(git diff --cached --exit-code) ]]; then
-            git add ./tests/integration_testing/results/plots
+            git add ./tests/integration_testing/results/plots/**/*.pdf
             git config --system user.email "github-action@users.noreply.github.com"
             git config --system user.name "GitHub Action"
             git commit -m "Upload results files from CI build"
diff --git a/tests/integration_testing/compare_results.py b/tests/integration_testing/compare_results.py
@@ -3,6 +3,10 @@
 import json
 import re
 from pathlib import Path
+import logging
+from scout.config import LogConfig
+LogConfig.configure_logging()
+logger = logging.getLogger(__name__)
 
 
 class ScoutCompare():
@@ -12,48 +16,71 @@ class ScoutCompare():
     """
 
     @staticmethod
-    def load_json(file_path):
+    def load_json(file_path: Path):
+        """Load json file as dictionary
+
+        Args:
+            file_path (Path): filepath of json file
+
+        Returns:
+            dict: json as a dictionary
+        """
         with open(file_path, 'r') as file:
             return json.load(file)
 
     @staticmethod
-    def load_summary_report(file_path):
+    def load_summary_report(file_path: Path):
+        """Read in a summary report
+
+        Args:
+            file_path (Path): filepath of summary report xlsx
+
+        Returns:
+            dict: summary report DataFrames keyed by sheet name
+        """
         reports = pd.read_excel(file_path, sheet_name=None, index_col=list(range(5)))
         return reports
 
-    def compare_dict_keys(self, dict1, dict2, paths, path='', key_diffs=None):
+    def compare_dict_keys(self,
+                          dict1: dict,
+                          dict2: dict,
+                          paths: list,
+                          path: str = '',
+                          key_diffs: pd.DataFrame = None):
         """Compares nested keys across two dictionaries by recursively searching each level
 
         Args:
             dict1 (dict): baseline dictionary to compare
             dict2 (dict): new dictionary to compare
             paths (list): paths to the original files from which the dictionaries are imported
-            path (str, optional): current dictionary path at whcih to compare. Defaults to ''.
+            path (str, optional): current dictionary path at which to compare. Defaults to ''.
             key_diffs (pd.DataFrame, optional): existing summary of difference. Defaults to None.
 
         Returns:
             pd.DataFrame: summary of differences specifying the file, the unique keys, and the
                 path that key is found at.
         """
         if key_diffs is None:
-            key_diffs = pd.DataFrame(columns=["Results file", "Unique key", "Found at"])
-        keys1 = set(dict1.keys())
-        keys2 = set(dict2.keys())
+            key_diffs = pd.DataFrame(columns=["Results file", "Unique key(s)", "Found at"])
+        keys1, keys2 = set(dict1.keys()), set(dict2.keys())
         only_in_dict1 = keys1 - keys2
         only_in_dict2 = keys2 - keys1
 
+        # Write report rows if keys differ
+        diff_entries = []
         if only_in_dict1:
-            new_row = pd.DataFrame({"Results file": f"{paths[0].parent.name}/{paths[0].name}",
-                                    "Unique key": str(only_in_dict1),
-                                    "Found at": path[2:]}, index=[0])
-            key_diffs = pd.concat([key_diffs, new_row], ignore_index=True)
+            diff_entries.extend([{"Results file": paths[0].as_posix(),
+                                  "Unique key(s)": str(list(only_in_dict1)),
+                                  "Found at": path[2:]}])
         if only_in_dict2:
-            new_row = pd.DataFrame({"Results file": f"{paths[1].parent.name}/{paths[1].name}",
-                                    "Unique key": str(only_in_dict2),
-                                    "Found at": path[2:]}, index=[0])
-            key_diffs = pd.concat([key_diffs, new_row], ignore_index=True)
+            diff_entries.extend([{"Results file": paths[1].as_posix(),
+                                  "Unique key(s)": str(list(only_in_dict2)),
+                                  "Found at": path[2:]}])
+        if diff_entries:
+            key_diffs = pd.concat([key_diffs, pd.DataFrame(diff_entries)], ignore_index=True)
 
-        for key in keys1.intersection(keys2):
+        # Recursively call if keys intersect
+        for key in keys1 & keys2:
             if isinstance(dict1[key], dict) and isinstance(dict2[key], dict):
                 key_diffs = self.compare_dict_keys(dict1[key],
                                                    dict2[key],
@@ -63,54 +90,82 @@ def compare_dict_keys(self, dict1, dict2, paths, path='', key_diffs=None):
 
         return key_diffs
 
-    def compare_dict_values(self, dict1, dict2, percent_threshold=10, abs_threshold=1000):
+    def compare_dict_values(self, dict1, dict2, percent_threshold=10):
         """Compares values across two dictionary by recursively searching keys until identifying
-            values at common paths. Both thresholds must be met to report results.
+            values at common paths. A difference is only reported if the percent difference
+            meets or exceeds the percent threshold and at least one value meets or exceeds the
+            absolute value threshold, which depends on the units of the values.
 
         Args:
             dict1 (dict): baseline dictionary to compare
             dict2 (dict): new dictionary to compare
             percent_threshold (int, optional): the percent difference threshold at which
                                                differences are reported. Defaults to 10.
-            abs_threshold (int, optional): the abosolute difference threshold at which differences
-                                           are reported. Defaults to 10.
 
         Returns:
             pd.DataFrame: summary of percent differences that meet thresholds
         """
         diff_report = {}
+        abs_threshold_map = {"USD": 1000, "MMBtu": 1000, "MMTons": 10}
 
-        def compare_recursive(d1, d2, path=""):
+        # Recursively navigate dicts until finding numeric values at the same location to compare
+        def compare_recursive(d1, d2, path="", units=""):
             for key in d1.keys():
                 current_path = f"{path}['{key}']"
+                units = next((unit for unit in abs_threshold_map.keys() if unit in key), units)
+                valid_nums = (int, float)
                 if isinstance(d1[key], dict) and key in d2:
-                    compare_recursive(d1[key], d2[key], current_path)
-                elif isinstance(d1[key], (int, float)) and key in d2:
-                    if isinstance(d2[key], (int, float)):
-                        val1 = d1[key]
-                        val2 = d2[key]
-                        if val1 != 0:
-                            percent_change = ((val2 - val1) / val1) * 100
-                            if (abs(percent_change) >= percent_threshold) and \
-                                    (abs(val1) >= abs_threshold or abs(val2) >= abs_threshold):
-                                diff_report[current_path] = percent_change
+                    compare_recursive(d1[key], d2[key], current_path, units)
+                elif isinstance(d1.get(key), valid_nums) and isinstance(d2.get(key), valid_nums):
+                    val1, val2 = d1[key], d2[key]
+                    if val1 == 0:
+                        percent_change = float("inf") if val2 != 0 else 0
+                    else:
+                        percent_change = ((val2 - val1) / val1) * 100
+                    abs_threshold = abs_threshold_map.get(units, float("inf"))
+                    if (abs(percent_change) >= percent_threshold) and \
+                            (abs(val1) >= abs_threshold or abs(val2) >= abs_threshold):
+                        diff_report[current_path] = {"base": val1,
+                                                     "new": val2,
+                                                     "percent_diff": percent_change}
 
         compare_recursive(dict1, dict2)
         return diff_report
 
-    def split_json_key_path(self, path):
+    def split_json_key_path(self, path: str):
+        """Parse a string of nested keys found in a results json file
+
+        Args:
+            path (str): string of nested keys separated by brackets
+
+        Returns:
+            list: list of individual keys
+        """
         keys = re.findall(r"\['(.*?)'\]", path)
         if len(keys) == 5:
             keys[4:4] = [None, None, None]
         return keys
 
-    def write_dict_key_report(self, diff_report, output_path):
+    def write_dict_key_report(self, diff_report: pd.DataFrame, output_path: Path):
+        """Writes a dictionary key report to a csv file
+
+        Args:
+            diff_report (pd.DataFrame): report with dictionary key differences
+            output_path (Path): csv output path
+        """
         if diff_report.empty:
+            logger.info(f"No key differences found, {output_path} not written")
             return
         diff_report.to_csv(output_path, index=False)
-        print(f"Wrote dictionary key report to {output_path}")
+        logger.info(f"Wrote dictionary key report to {output_path}")
+
+    def write_dict_value_report(self, diff_report: pd.DataFrame, output_path: Path):
+        """Writes a dictionary value report to a csv file
 
-    def write_dict_value_report(self, diff_report, output_path):
+        Args:
+            diff_report (dict): maps each results path to its base, new, and percent_diff values
+            output_path (Path): csv output path
+        """
         col_headers = [
             "ECM",
             "Markets and Savings Type",
@@ -123,20 +178,30 @@ def write_dict_value_report(self, diff_report, output_path):
         ]
         df = pd.DataFrame(columns=["Results path"], data=list(diff_report.keys()))
         if df.empty:
+            logger.info(f"No changes above the threshold found, {output_path} not written")
             return
         df[col_headers] = df["Results path"].apply(self.split_json_key_path).apply(pd.Series)
-        df["Percent difference"] = [round(diff, 2) for diff in diff_report.values()]
+        df["Percent difference"] = [
+            round(diff_dict["percent_diff"], 2) for diff_dict in diff_report.values()]
+        df["Base value"] = [round(diff_dict["base"], 2) for diff_dict in diff_report.values()]
+        df["New value"] = [round(diff_dict["new"], 2) for diff_dict in diff_report.values()]
         df = df.dropna(axis=1, how="all")
         df.to_csv(output_path, index=False)
-        print(f"Wrote dictionary value report to {output_path}")
+        logger.info(f"Wrote dictionary value report to {output_path}")
 
-    def compare_jsons(self, json1_path, json2_path, output_dir=True):
+    def compare_jsons(self,
+                      json1_path: Path,
+                      json2_path: Path,
+                      percent_threshold: float,
+                      output_dir: Path = None):
         """Compare two jsons and report differences in keys and in values
 
         Args:
             json1_path (Path): baseline json file to compare
             json2_path (Path): new json file to compare
-            write_reports (bool, optional): _description_. Defaults to True.
+            percent_threshold (float): threshold for reporting percent difference of values
+            output_dir (Path, optional): output directory where comparison reports are saved.
+                                         Defaults to None.
         """
         json1 = self.load_json(json1_path)
         json2 = self.load_json(json2_path)
@@ -148,18 +213,21 @@ def compare_jsons(self, json1_path, json2_path, output_dir=True):
         self.write_dict_key_report(key_diffs, output_dir / f"{json2_path.stem}_key_diffs.csv")
 
         # Compare differences in json values
-        val_diffs = self.compare_dict_values(json1, json2)
+        val_diffs = self.compare_dict_values(json1, json2, percent_threshold=percent_threshold)
         self.write_dict_value_report(val_diffs, output_dir / f"{json2_path.stem}_value_diffs.csv")
 
-    def compare_summary_reports(self, report1_path, report2_path, output_dir=None):
+    def compare_summary_reports(self,
+                                report1_path: Path,
+                                report2_path: Path,
+                                output_dir: Path = None):
         """Compare Summary_Data-TP.xlsx and Summary_Data-MAP.xlsx with baseline files
 
         Args:
             report1_path (Path): baseline summary report to compare
             report2_path (Path): new summary report to compare
-            output_dir (Path, optional): _description_. Defaults to None.
+            output_dir (Path, optional): output directory where comparison report is saved.
+                                         Defaults to None.
         """
-
         reports1 = self.load_summary_report(report1_path)
         reports2 = self.load_summary_report(report2_path)
         if output_dir is None:
@@ -170,7 +238,7 @@ def compare_summary_reports(self, report1_path, report2_path, output_dir=None):
                 diff = (100 * (report2 - report1)/report1).round(2)
                 diff = diff.reset_index()
                 diff.to_excel(writer, sheet_name=output_type, index=False)
-        print(f"Wrote Summary_Data percent difference report to {output_path}")
+        logger.info(f"Wrote Summary_Data percent difference report to {output_path}")
 
 
 def main():
@@ -194,10 +262,16 @@ def main():
         new_dir = args.new_dir.resolve()
         agg_json_base = base_dir / "agg_results.json"
         agg_json_new = new_dir / "agg_results.json"
-        compare.compare_jsons(agg_json_base, agg_json_new, output_dir=new_dir)
+        compare.compare_jsons(agg_json_base,
+                              agg_json_new,
+                              percent_threshold=args.threshold,
+                              output_dir=new_dir)
         ecm_json_base = base_dir / "ecm_results.json"
         ecm_json_new = new_dir / "ecm_results.json"
-        compare.compare_jsons(ecm_json_base, ecm_json_new, output_dir=new_dir)
+        compare.compare_jsons(ecm_json_base,
+                              ecm_json_new,
+                              percent_threshold=args.threshold,
+                              output_dir=new_dir)
 
         summary_tp_base = base_dir / "Summary_Data-TP.xlsx"
         summary_tp_new = new_dir / "plots" / "tech_potential" / "Summary_Data-TP.xlsx"
@@ -208,7 +282,9 @@ def main():
     else:
         # Compare only as specified by the arguments
         if args.json_baseline and args.json_new:
-            compare.compare_jsons(args.json_baseline, args.json_new)
+            compare.compare_jsons(args.json_baseline,
+                                  args.json_new,
+                                  percent_threshold=args.threshold)
         if args.summary_baseline and args.summary_new:
             compare.compare_summary_reports(args.summary_baseline, args.summary_new)