ufs-community · gspetro-NOAA · Sep 18, 2025 · Sep 19, 2025 · Sep 19, 2025 · Sep 18, 2025
diff --git a/.github/scripts/__init__.py b/.github/scripts/__init__.py
diff --git a/.github/scripts/get_data.py b/.github/scripts/get_data.py
@@ -0,0 +1,259 @@
+import requests
+import os
+import json
+from datetime import datetime
+import re
+import numpy as np
+import logging
+
+class APICall():
+   """Connection details for a single GitHub REST API request.
+
+   Attributes:
+      token: Value of the GITHUB_TOKEN environment variable (None if unset).
+      base_url: Value of the BASE_URL environment variable (None if unset).
+      endpoint: Path that is appended to base_url.
+      url: base_url and endpoint joined with a single "/".
+      num_commits: Stored exactly as given; this class does not use it itself.
+      header: HTTP headers to send with the request.
+   """
+
+   def __init__(self, endpoint='', num_commits=1):
+      """Build the URL and the request headers for `endpoint`.
+
+      Args:
+         endpoint (str): API path relative to BASE_URL.
+         num_commits (int): Kept on the instance for callers that want it.
+      """
+      self.token = os.environ.get('GITHUB_TOKEN')
+      self.base_url = os.environ.get('BASE_URL')
+      self.endpoint = endpoint
+      self.url = f"{self.base_url}/{self.endpoint}"
+      self.num_commits = num_commits
+      # A dict literal keeps only the last value of a repeated key, so "Accept"
+      # is listed exactly once. The raw media type is the value that takes effect;
+      # Log._fetch_log_text() consumes the response body directly as log text.
+      self.header = {
+         "Accept": "application/vnd.github.raw",
+         "Authorization": f"Bearer {self.token}",
+         "X-GitHub-Api-Version": "2022-11-28",
+      }
+
+class Log():
+   """A Regression Test log file for one machine.
+
+   Attributes:
+      machine: Lower-cased machine name, used to build the log file name.
+      text_per_log: Log text for every fetched commit. When the PR log is fetched
+         first (see get_current_pr_data) it sits at index 0; the logs from the
+         authoritative repository follow in the order the API listed the commits.
+      pr_head_commit: One-element list holding the PR head SHA, or None until
+         _get_pr_head() has run.
+      repo_commits: SHAs collected by _fetch_repo_commits().
+   """
+
+   # Number of standard deviations above the historical mean that counts as abnormal.
+   # main() and the published summary key both describe a "two standard deviations" rule.
+   NUM_STDEVS = 2
+   # Seconds to wait for GitHub before giving up instead of hanging the workflow.
+   REQUEST_TIMEOUT = 30
+   # Matches e.g.  TEST 'name' [12:34, 05:06](789 MB)  and captures the name, both
+   # fields of the second bracketed time, and the memory figure.
+   _TEST_PATTERN = re.compile(r"TEST \'(.*)\' \[\d+:\d+, (\d+):(\d+)\]\((\d+) MB\)")
+
+   def __init__(self, machine):
+      """Create the log file object for a specific machine."""
+      self.machine = machine.lower()
+      self.text_per_log = []
+      # Defined up front so _fetch_log_text() can compare against them safely.
+      self.pr_head_commit = None
+      self.repo_commits = []
+
+   def call_API(self, endpoint):
+      """Call the GitHub API and return the decoded JSON body.
+
+      Args:
+         endpoint (str): API path relative to BASE_URL.
+      Returns:
+         The parsed JSON document (a dict or a list, depending on the endpoint).
+      """
+
+      api_call = APICall(endpoint)
+      response = requests.get(api_call.url, headers=api_call.header, timeout=self.REQUEST_TIMEOUT)
+
+      return json.loads(response.text)
+
+   def _get_pr_head(self):
+      """Store the SHA of the PR's HEAD commit in self.pr_head_commit (as a one-element list).
+         Structure of response: response = {"head": {"sha": "a1b2c3d..."}, ...}
+         See GitHub documentation for https://docs.github.com/en/rest/pulls/pulls?apiVersion=2022-11-28#get-a-pull-request
+      """
+      response = self.call_API(f"pulls/{os.environ.get('PR_NUM')}")
+      self.pr_head_commit = [response['head']['sha']]
+
+   def _fetch_repo_commits(self, num_commits=1):
+      """Get a list of commits for the log file from the authoritative repository, with a maximum of 100 and a default of 1.
+      Structure of response: response = [{'sha': '3jl26ka...'}, {'sha': '6ag43sb...'}, ...]
+      See GitHub documentation for https://docs.github.com/en/rest/commits/commits?apiVersion=2022-11-28#list-commits
+
+      The SHAs are stored in self.repo_commits; entries without a 'sha' are logged and skipped.
+      """
+      response = self.call_API(f"commits?path=tests/logs/RegressionTests_{self.machine}.log&per_page={num_commits}")
+
+      self.repo_commits = []
+      # A failed call returns a JSON object rather than the expected list of commits.
+      if not isinstance(response, list):
+         logging.error("API Call failed. The sha does not exist!")
+         return
+
+      for commit in response:
+         try:
+            self.repo_commits.append(commit['sha'])
+         except (KeyError, TypeError):
+            logging.error("API Call failed. The sha does not exist!")
+
+   def _fetch_log_text(self, commits):
+      """For each commit of a log, download the log text into self.text_per_log.
+
+      Args:
+         commits (list): Commit SHAs, normally self.pr_head_commit or self.repo_commits.
+      """
+
+      if not commits:
+         logging.error("An appropriate commit(s) was not provided. Call _get_pr_head() or _fetch_repo_commits() first.")
+         return
+
+      api_call = APICall(f"contents/tests/logs/RegressionTests_{self.machine}.log")
+      is_pr_log = self.pr_head_commit is not None and commits == self.pr_head_commit
+
+      for commit in commits:
+         url = f"{api_call.url}?ref={commit}"
+         try:
+            r = requests.get(url, headers=api_call.header, timeout=self.REQUEST_TIMEOUT)
+         except requests.RequestException as err:
+            # Stop here: later code relies on the position of each log in text_per_log.
+            logging.error("Could not fetch %s: %s", url, err)
+            return
+         if is_pr_log:
+            # Ensure that the pr log text comes first
+            self.text_per_log.insert(0, r.text)
+         else:
+            self.text_per_log.append(r.text)
+
+   def _get_instance_test_data(self, log_instance):
+      """For each instance of a log at a given commit, extract runtime and memory data from the log text
+         Args:
+            log_instance: Log text for a given commit
+         Returns:
+            tests_for_log_instance: A dictionary of tests (keys) with [runtime, memory] as the value for each test.
+            runtime is (first field * 60 + second field) of the second bracketed time; memory is the MB figure.
+      """
+
+      tests_for_log_instance = {}
+
+      for line in log_instance.splitlines():
+         test_match = self._TEST_PATTERN.search(line)
+         if test_match:
+            test_name, major, minor, mem = test_match.groups()
+            # NOTE(review): the unit of the two time fields is not visible here — confirm against the log format.
+            tests_for_log_instance[test_name] = [int(major) * 60 + int(minor), int(mem)]
+
+      return tests_for_log_instance
+
+   def _compile_historical_log_data(self): # Could split for runtime, mem to make more maintainable
+      """Create a dictionary of data with runtime and memory usage for each test over time. Structure:
+         historical_test_data = {
+            test: {runtime: [], memory: []}
+         }
+      """
+
+      self.historical_rt_mem_data = {}
+
+      # Skip self.text_per_log[0] because it is the log from the PR
+      for log_instance in self.text_per_log[1:]:
+         for test, (runtime, memory) in self._get_instance_test_data(log_instance).items():
+            if test not in self.historical_rt_mem_data:
+               logging.info("Test key doesn't exist yet. Creating test key.")
+               self.historical_rt_mem_data[test] = {"runtime": [], "memory": []}
+            self.historical_rt_mem_data[test]["runtime"].append(runtime)
+            self.historical_rt_mem_data[test]["memory"].append(memory)
+
+   def calculate_stats(self):
+      """For each test, calculate the mean and standard deviation of memory and runtime.
+
+      Fills self.test_stats with test -> [runtime_mean, runtime_stdev, memory_mean, memory_stdev],
+      each rounded to 5 decimal places and stored as a plain float.
+      """
+      self.test_stats = {}
+      for test, history in self.historical_rt_mem_data.items():
+         stats = []
+         for metric in ("runtime", "memory"):
+            values = history[metric]
+            stats.append(round(float(np.mean(values)), 5))
+            stats.append(round(float(np.std(values)), 5))
+         self.test_stats[test] = stats
+
+   def _compare_metric(self, current_log, previous_logs, metric_index):
+      """Classify every test of the current log for one metric.
+
+      Args:
+         current_log (dict): test -> [runtime, memory] for the PR log.
+         previous_logs (dict): {"last": {...}, "second_to_last": {...}} in the same format.
+         metric_index (int): 0 for runtime, 1 for memory.
+      Returns:
+         dict: test -> '✅', '⚠️', '❌' or 'New'.
+      """
+      # test_stats is laid out as [runtime_mean, runtime_stdev, memory_mean, memory_stdev].
+      mean_index = 2 * metric_index
+      stdev_index = mean_index + 1
+      results = {}
+
+      for test, values in current_log.items():
+         stats = self.test_stats.get(test)
+         if stats is None:
+            logging.info(f"{test} is new. No comparison data.")
+            results[test] = 'New'
+            continue
+
+         limit = stats[mean_index] + self.NUM_STDEVS * stats[stdev_index]
+         if not values[metric_index] > limit:
+            results[test] = '✅'
+            continue
+
+         # A failure needs both previous logs to be over the limit as well; a test that
+         # is missing from a previous log cannot confirm that, so it stays a warning.
+         sustained = all(
+            test in previous_logs.get(key, {}) and previous_logs[key][test][metric_index] > limit
+            for key in ("last", "second_to_last")
+         )
+         results[test] = '❌' if sustained else '⚠️'
+
+      return results
+
+   def _compare_runtime(self, current_log, previous_logs):
+      """Determine whether the test runtime is within normal bounds."""
+
+      self.runtime_results = self._compare_metric(current_log, previous_logs, 0)
+
+   def _compare_memory(self, current_log, previous_logs):
+      """Determine whether the test memory usage is within normal bounds."""
+
+      self.memory_results = self._compare_metric(current_log, previous_logs, 1)
+
+   def compare_results(self):
+      """Check results from previous two commits to determine whether the test runtime/memory usage is within normal bounds.
+
+      Reads self.text_per_log[0] as the PR log and indices 1 and 2 as the two previous logs;
+      a previous log that was not fetched is treated as containing no tests.
+      """
+
+      current_log = self._get_instance_test_data(self.text_per_log[0])
+      previous_logs = {}
+
+      for position, label in enumerate(("last", "second_to_last"), start=1):
+         if position < len(self.text_per_log):
+            previous_logs[label] = self._get_instance_test_data(self.text_per_log[position])
+         else:
+            previous_logs[label] = {}
+
+      self._compare_runtime(current_log, previous_logs)
+      self._compare_memory(current_log, previous_logs)
+
+   def get_current_pr_data(self):
+      """Extract runtime/memory data for the PR's most recent commit."""
+
+      self._get_pr_head()
+      self._fetch_log_text(self.pr_head_commit)
+      pr_log_data = self._get_instance_test_data(self.text_per_log[0])
+
+      return pr_log_data
+
+   def gather_historical_data(self, num_commits=2):
+      """Extract runtime/memory data for the authoritative repository's last `num_commits` commits (default 2)."""
+      self._fetch_repo_commits(num_commits) #increase for statistical significance
+      self._fetch_log_text(self.repo_commits)
+      self._compile_historical_log_data()
+
+"""Utilities for file I/O"""
+
+def create_json(dictionary, file_name):
+   """Create a json file with statistics for each test on each machine
+
+   Args:
+      dictionary (dict): JSON-serializable data to write.
+      file_name (str): File name without extension; the file is written to data/<file_name>.json
+         relative to the current working directory.
+   """
+
+   # Make sure the output directory exists so the first run does not fail.
+   os.makedirs("data", exist_ok=True)
+   with open(f"data/{file_name}.json", 'w', encoding='utf-8') as fh:
+      json.dump(dictionary, fh, indent=4)
+
+def load_json(file_path):
+   """Read the JSON document stored at `file_path` and return it as Python data."""
+   with open(file_path, 'r', encoding='utf-8') as source:
+      parsed = json.loads(source.read())
+
+   return parsed
+
+def main():
+   """For each machine, create a log object, get current PR data, gather historical runtime/memory data,
+   and compare results to determine which test/machine combinations fall outside normal bounds
+   (see Log.compare_results).
+
+   Environment:
+      MACHINES: Whitespace-separated machine names.
+      TEST_STATS: Optional path to a cached statistics JSON file keyed by machine name.
+
+   Returns:
+      int: 0 once all result files have been written.
+   """
+
+   machines = os.environ.get('MACHINES').split()
+
+   # Read the cached statistics once instead of re-parsing the file for every machine.
+   stats_path = os.environ.get('TEST_STATS')
+   cached_stats = load_json(stats_path) if stats_path else None
+
+   # Contains mean and standard deviation for each test on each machine
+   stats_by_machine = {}
+   # Contains the runtime status of each test on each machine
+   runtime_results_by_machine = {}
+   # Contains the memory status of each test on each machine
+   mem_results_by_machine = {}
+
+   for machine in machines:
+      print(machine.upper())
+      log = Log(machine)
+      log.get_current_pr_data()
+      # Case where test stats have been calculated and cached:
+      if cached_stats is not None:
+         log.gather_historical_data(2) # past two commits only
+         log.test_stats = cached_stats[machine]
+
+      # Case where test stats have NOT been calculated and cached:
+      else:
+         log.gather_historical_data(50) # past 50 commits
+         log.calculate_stats()
+         stats_by_machine[machine] = log.test_stats # Add stats to save/cache later
+
+      # Compare and save results
+      log.compare_results()
+      runtime_results_by_machine[machine] = log.runtime_results
+      mem_results_by_machine[machine] = log.memory_results
+
+   # If the statistics on mean/standard deviation have NOT already been cached, create file to cache.
+   if cached_stats is None:
+      create_json(stats_by_machine, "stats")
+
+   # Create resource summaries to use in write_test_summary.py
+   create_json(runtime_results_by_machine, "runtime_results")
+   create_json(mem_results_by_machine, "memory_results")
+
+   return 0
+
+if __name__ == "__main__": # pragma: no coverage
+
+   main()
diff --git a/.github/scripts/write_test_summary.py b/.github/scripts/write_test_summary.py
@@ -0,0 +1,136 @@
+import os
+import json
+import re
+from mdutils.mdutils import MdUtils
+import pandas as pd
+
+def load_json(file_path):
+   """Open the UTF-8 JSON file at `file_path` and return its decoded contents."""
+   with open(file_path, mode='r', encoding='utf-8') as handle:
+      return json.load(handle)
+
+def create_mdFile():
+   """Return a new MdUtils document for summary.md, titled with the PR number from $PR_NUM."""
+   title = f"Test Summary for PR #{os.environ.get('PR_NUM')}"
+
+   return MdUtils(file_name='summary.md', title=title)
+
+def build_content(category):
+   """Assemble the results table for one category.
+   Args:
+      category (str): "runtime" or "memory"; the JSON path is read from $<CATEGORY>_RESULTS.
+   Returns:
+      DataFrame with one row per test and one column per machine, plus a per-test
+      "Passing" column and a final per-machine totals row.
+   """
+
+   results_path = os.environ.get(f"{category.upper()}_RESULTS")
+   by_machine = load_json(results_path)
+
+   table = pd.DataFrame()
+   for machine, statuses in by_machine.items():
+      # One single-column frame per machine, outer-joined on the test name.
+      column = pd.DataFrame.from_dict(statuses, orient='index', columns=[machine])
+      merged = pd.merge(table, column, left_index=True, right_index=True, how='outer')
+      # Tests that a machine does not report show up as missing values after the join.
+      table = merged.fillna("N/A")
+
+   with_rates = _count_passes_per_test(table)
+   totals_row = _count_passes_per_machine(with_rates)
+
+   return pd.concat([with_rates, totals_row])
+
+def write_content(data, mdFile):
+   """Write the results table for one category and close its <details> section.
+
+   Only rows containing a warning or a failure are written, plus the
+   'Platform Total (Passing):' summary row.
+
+   Args:
+      data (DataFrame): Results table; rows are tests, columns are machines plus "Passing".
+      mdFile: Markdown document providing new_table(), new_paragraph() and write().
+   Returns:
+      mdFile: The same document, with the table appended.
+   """
+
+   warn = '⚠️'
+   fail = '❌'
+   summary_label = 'Platform Total (Passing):'
+
+   # Take the header labels from the table itself so that each header always sits
+   # above the column it describes and the cell count always matches the column count.
+   contents = ["Test"] + [str(column) for column in data.columns]
+
+   # Create table starting with one row (header)
+   rows = 1
+   for index, row in data.iterrows():
+      # If there is a warn or fail in the row, add the row to contents to be printed; also add summary row
+      if row.isin([warn, fail]).any() or index == summary_label:
+         rows += 1
+         contents.append(str(index))
+         contents.extend(row)
+
+   mdFile.new_table(columns=len(data.columns) + 1, rows=rows, text_align='center', text=contents)
+   mdFile.new_paragraph('\n')
+   mdFile.write('</details>')
+
+   return mdFile
+
+def _count_passes_per_machine(data):
+   """Count the passing tests in each column and produce a one-row table with the totals.
+   Args:
+      data(DataFrame): Table of tests and pass/warn/fail status by machine
+   Returns:
+      machine_total(DataFrame): A single row labelled 'Platform Total (Passing):' holding
+      "**<COLUMN>:** <passed>/<not N/A> passing" per column and an empty string under 'Passing'.
+   """
+
+   passed = data.eq('✅').sum(axis=0).astype(str)
+   reported = data.ne('N/A').sum(axis=0).astype(str)
+   totals = passed + '/' + reported
+
+   for column in totals.index:
+      totals[column] = f"**{column.upper()}:** " + totals[column] + " passing"
+
+   totals.name = 'Platform Total (Passing):'
+   # Set bottom right corner to empty string
+   totals.loc['Passing'] = ''
+
+   return pd.DataFrame(totals).T
+
+def _count_passes_per_test(data):
+   """Add a 'Passing' column giving, per test, "<machines passing>/<machines not N/A>".
+   Args:
+      data (DataFrame): DataFrame containing pass/warn/fail status for each test on each machine
+   Returns:
+      data: the same table with the extra 'Passing' column appended
+   """
+
+   passed = data.eq('✅').sum(axis=1).astype(str)
+   reported = data.ne('N/A').sum(axis=1).astype(str)
+
+   rate = passed + "/" + reported
+   rate.name = 'Passing'
+
+   return pd.merge(data, pd.DataFrame(rate), left_index=True, right_index=True, how='inner')
+
+def create_summary(categories):
+   """Build the markdown summary: one collapsible section (heading, key, results table) per category.
+   Args:
+      categories (list): Test categories. Currently 'runtime' and 'memory'.
+   Returns:
+      mdFile: A markdown file
+   """
+
+   mdFile = create_mdFile()
+
+   for category in categories:
+      title = category.title()
+      key_lines = [
+         "<h4>Key:</h4>",
+         f"&nbsp;&nbsp;&nbsp;&nbsp;✅ = NORMAL {category}: {title} falls within two standard deviations of the mean.",
+         f"&nbsp;&nbsp;&nbsp;&nbsp;⚠️ = {title} WARNING: {title} is greater than two standard deviations above the mean.",
+         f"&nbsp;&nbsp;&nbsp;&nbsp;❌ = {title} FAIL: For the past 2+ PRs, {category} has been greater than two standard deviations above the mean.",
+         "&nbsp;&nbsp;&nbsp;&nbsp;N/A = Test does not run on this machine.",
+      ]
+
+      # Open the <details> section; write_content() emits the closing tag.
+      mdFile.write(f"<details><summary><h3>{category.upper()} Results Summary</h3></summary>")
+      mdFile.new_paragraph('\n')
+      for text in key_lines:
+         mdFile.new_paragraph(text)
+      mdFile.new_paragraph('\n')
+
+      # Load the results table for this category and append it to the document
+      mdFile = write_content(build_content(category), mdFile)
+
+   return mdFile
+
+def main(): # pragma: no cover
+   """Build the runtime and memory summary and print it as markdown text."""
+
+   categories = ['runtime', 'memory']
+   md_text = create_summary(categories).get_md_text()
+   print(md_text)
+
+if __name__ == "__main__": # pragma: no cover
+
+   main()
diff --git a/.github/tests/__init__.py b/.github/tests/__init__.py