From aab94e154166b56e1deddb6439a19d767a56a653 Mon Sep 17 00:00:00 2001
From: Guillaume Vernieres
Date: Mon, 10 Mar 2025 10:48:30 -0400
Subject: [PATCH 1/3] pie chart

---
 utils/profiling/oops_app_profile.py | 72 +++++++++++++++++++++++++++++
 1 file changed, 72 insertions(+)
 create mode 100644 utils/profiling/oops_app_profile.py

diff --git a/utils/profiling/oops_app_profile.py b/utils/profiling/oops_app_profile.py
new file mode 100644
index 000000000..59456ae5a
--- /dev/null
+++ b/utils/profiling/oops_app_profile.py
@@ -0,0 +1,72 @@
+import matplotlib.pyplot as plt
+import re
+
+# Load the profiling data file
+file_path = "oops_stats.txt"
+
+# Define a regex to extract parallel timing statistics
+pattern = re.compile(r"OOPS_STATS\s+(.+?)\s+:\s+(\d+\.\d+)")
+
+# Read and parse the file
+runtimes = {}
+in_parallel_section = False
+with open(file_path, "r") as file:
+    for line in file:
+        if "---------------------------------- Parallel Timing Statistics" in line:
+            if in_parallel_section:
+                break  # Stop parsing at the end of the section
+            else:
+                in_parallel_section = True
+            continue
+
+        if in_parallel_section and "OOPS_STATS" in line:
+            print(f"-------- {line}")
+            match = pattern.search(line)
+            if match:
+                key, runtime = match.groups()
+                runtimes[key.strip()] = float(runtime) / 1000  # Convert ms to seconds
+
+# Ensure there is data to plot
+if runtimes:
+    # Sort by runtime in descending order
+    sorted_runtimes = sorted(runtimes.items(), key=lambda item: item[1], reverse=True)
+
+    # Calculate cumulative runtime and determine the cutoff for the top 95%
+    total_runtime = sum(runtime for _, runtime in sorted_runtimes)
+    cumulative_runtime = 0
+    top_runtimes = []
+    other_runtime = 0
+
+    for key, runtime in sorted_runtimes:
+        if cumulative_runtime / total_runtime < 0.95:
+            top_runtimes.append((key, runtime))
+            cumulative_runtime += runtime
+        else:
+            other_runtime += runtime
+
+    # Add the "Other" category
+    if other_runtime > 0:
+        top_runtimes.append(("Other", other_runtime))
+
+    # Prepare data for plotting
+    #print(top_runtimes)
+    top_runtimes = [(key, size) for key, size in top_runtimes if "Total" not in key and "measured" not in key]
+    labels, sizes = zip(*top_runtimes)
+    print(f"sizes: {sizes}")
+    print(f"labels: {labels}")
+
+    # Generate Pie Chart with labels on the side
+    plt.figure(figsize=(15, 10))
+    wedges, texts, autotexts = plt.pie(sizes, autopct='%1.1f%%', startangle=140)
+    for i, text in enumerate(autotexts):
+        text.set_text(f'{sizes[i]:.2f}')
+
+    # Add a legend with the labels
+    plt.legend(wedges, labels, title="Categories")
+
+    plt.title("Parallel Runtime Distribution from OOPS Profiling Data", fontsize=16, fontweight='bold')
+    plt.xlabel("Runtime (s)", fontsize=14)
+    plt.axis('equal')  # Equal aspect ratio ensures that pie is drawn as a circle.
+    plt.show()
+else:
+    print("No timing data found in the Parallel Timing Statistics section.")
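For reference, the regular expression above expects timer lines of the form "OOPS_STATS <name> : <value>" inside the "Parallel Timing Statistics" section of the OOPS log, with the value in milliseconds. A minimal, self-contained sketch of the parsing step; the sample line and its numbers are illustrative, not taken from a real log:

    import re

    pattern = re.compile(r"OOPS_STATS\s+(.+?)\s+:\s+(\d+\.\d+)")

    # Hypothetical timer line, for illustration only.
    sample = "OOPS_STATS oops::Covariance::SABER::multiply : 123456.7"

    match = pattern.search(sample)
    if match:
        key, runtime = match.groups()
        # Timings are reported in milliseconds; convert to seconds as the script does.
        print(key.strip(), float(runtime) / 1000)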
From c824a1da3a7d5b5aad174f4008999c4de413c6ea Mon Sep 17 00:00:00 2001
From: Guillaume Vernieres
Date: Tue, 11 Mar 2025 13:16:53 -0400
Subject: [PATCH 2/3] parse yaml

---
 utils/profiling/oops_app_profile.py | 40 +++++++++++++++++++++--------
 utils/profiling/profile.yaml        | 35 +++++++++++++++++++++++++
 2 files changed, 65 insertions(+), 10 deletions(-)
 create mode 100644 utils/profiling/profile.yaml

diff --git a/utils/profiling/oops_app_profile.py b/utils/profiling/oops_app_profile.py
index 59456ae5a..958fac5f1 100644
--- a/utils/profiling/oops_app_profile.py
+++ b/utils/profiling/oops_app_profile.py
@@ -1,8 +1,20 @@
+import argparse
+import yaml
 import matplotlib.pyplot as plt
 import re

-# Load the profiling data file
-file_path = "oops_stats.txt"
+# Parse command-line arguments
+parser = argparse.ArgumentParser(description='Process profiling data from a YAML configuration file.')
+parser.add_argument('config', type=str, help='Path to the YAML configuration file')
+args = parser.parse_args()
+
+# Load the YAML configuration file
+with open(args.config, 'r') as yaml_file:
+    config = yaml.safe_load(yaml_file)
+
+# Extract the file path from the configuration
+file_path = config['oops log']
+methods = config['methods']

 # Define a regex to extract parallel timing statistics
 pattern = re.compile(r"OOPS_STATS\s+(.+?)\s+:\s+(\d+\.\d+)")
@@ -20,7 +32,6 @@
             continue

         if in_parallel_section and "OOPS_STATS" in line:
-            print(f"-------- {line}")
             match = pattern.search(line)
             if match:
                 key, runtime = match.groups()
@@ -36,24 +47,33 @@
     cumulative_runtime = 0
     top_runtimes = []
     other_runtime = 0
+    # Convert sorted_runtimes to a dictionary
+    sorted_runtimes_dict = {key: runtime for key, runtime in sorted_runtimes}
+
+    # print the sorted_runtimes_dict one key/value pair per line
+    for key, value in sorted_runtimes_dict.items():
+        print(f"{key}: {value}")
+
+    total_runtime_value = sorted_runtimes_dict['util::Timers::Total']

     for key, runtime in sorted_runtimes:
-        if cumulative_runtime / total_runtime < 0.95:
+        if key in methods:
+            print(f"---------- key: {key}, runtime: {runtime}")
             top_runtimes.append((key, runtime))
             cumulative_runtime += runtime
-        else:
-            other_runtime += runtime
+
+    other_runtime = total_runtime_value - cumulative_runtime
+
+    print(f"Total runtime: {total_runtime_value}")
+    print(f"Top runtime: {cumulative_runtime}")
+    print(f"Other runtime: {other_runtime}")

     # Add the "Other" category
     if other_runtime > 0:
         top_runtimes.append(("Other", other_runtime))

     # Prepare data for plotting
-    #print(top_runtimes)
-    top_runtimes = [(key, size) for key, size in top_runtimes if "Total" not in key and "measured" not in key]
     labels, sizes = zip(*top_runtimes)
-    print(f"sizes: {sizes}")
-    print(f"labels: {labels}")

     # Generate Pie Chart with labels on the side
     plt.figure(figsize=(15, 10))
diff --git a/utils/profiling/profile.yaml b/utils/profiling/profile.yaml
new file mode 100644
index 000000000..ae3eff704
--- /dev/null
+++ b/utils/profiling/profile.yaml
@@ -0,0 +1,35 @@
+oops log: 'oops_stats.txt'
+methods:
+- oops::Covariance::SABER::multiply
+- oops::State::State
+- oops::Increment::diff
+- oops::Geometry::Geometry
+- oops::State::write
+- oops::Model::step
+- oops::State::read
+- oops::Increment::write
+- oops::ObsSpace::ObsSpace
+- oops::ObsSpace::save
+- oops::UnstructuredInterpolator::apply
+- oops::LinearVariableChange::changeVarTraj
+#- oops::Covariance::SABER::Constructor
+#- oops::Increment::Increment
+#- oops::GetValues::processTL
+#- oops::Increment::read
+#- oops::GetValues::GetValues
+#- oops::GetValues::processAD
+#- oops::LinearVariableChange::changeVarTL
+#- oops::LinearVariableChange::changeVarAD
+#- oops::Increment::operator=
+#- oops::UnstructuredInterpolator::applyAD
+#- oops::VariableChange::changeVar
+#- oops::Increment::operator+=(State, Increment)
+#- oops::Parameters::deserialize
+#- oops::GetValues::fillGeoVaLsTL
+#- oops::GetValues::process
+#- oops::ObsVector::dot_product
+#- oops::Increment::toFieldSet
+#- oops::GetValues::fillGeoVaLsAD
+#- oops::State::toFieldSet
+#- oops::Increment::fromFieldSet
+#
\ No newline at end of file
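With this patch the script is driven entirely by the configuration file, e.g. "python oops_app_profile.py profile.yaml". Note that the "Other" slice is now derived from the util::Timers::Total timer rather than from a cumulative cutoff, so that entry must be present among the parsed timers; a small defensive-lookup sketch (the fallback to the sum of the measured timers is an assumption, not part of the patch):

    # Illustrative values only.
    runtimes = {
        "oops::State::State": 12.3,
        "oops::Model::step": 48.9,
        "util::Timers::Total": 250.0,
    }

    # The patch indexes runtimes['util::Timers::Total'] directly; guarding the
    # lookup avoids a KeyError when that timer is missing from the log.
    total = runtimes.get("util::Timers::Total", sum(runtimes.values()))
    print(f"total runtime: {total:.1f} s")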
From a9d77f885ff257d0dc71384ff3f21e93d42fd3ef Mon Sep 17 00:00:00 2001
From: Ricardo Todling
Date: Wed, 26 Mar 2025 12:02:08 -0400
Subject: [PATCH 3/3] Add ability to compare timings among diff exp in bar plot-style

---
 utils/profiling/cmp2exp.yaml        |  49 ++++++++++
 utils/profiling/oops_app_profile.py | 145 +++++++++++++++++++++++-----
 utils/profiling/profile.yaml        |   5 +-
 3 files changed, 173 insertions(+), 26 deletions(-)
 create mode 100644 utils/profiling/cmp2exp.yaml

diff --git a/utils/profiling/cmp2exp.yaml b/utils/profiling/cmp2exp.yaml
new file mode 100644
index 000000000..21b88713b
--- /dev/null
+++ b/utils/profiling/cmp2exp.yaml
@@ -0,0 +1,49 @@
+oops log: ['exp1.log','exp2.log']
+plot type: bars
+bar attributes:
+  colors: ['b','r']
+  labels: ['Exp1','Exp2']
+  width: 0.35
+methods:
+- oops::Covariance::SABER::multiply
+- oops::Geometry::Geometry
+#- oops::GetValues::GetValues
+#- oops::GetValues::finalizeAD
+- oops::GetValues::process
+- oops::GetValues::processAD
+- oops::GetValues::processTL
+#- oops::Increment::Increment
+#- oops::Increment::axpy
+#- oops::Increment::dot_product_with
+#- oops::Increment::fromFieldSet
+#- oops::Increment::operator=
+#- oops::Increment::print
+- oops::Increment::write
+#- oops::Increment::toFieldSet
+#- oops::LinearObsOper::AIRS AQUA::simulateObsAD
+#- oops::LinearObsOper::CRIS-FSR NOAA-20::setTrajectory
+#- oops::LinearObsOper::CRIS-FSR NOAA-20::simulateObsAD
+#- oops::LinearObsOper::CRIS-FSR NPP::setTrajectory
+#- oops::LinearObsOper::CRIS-FSR NPP::simulateObsAD
+#- oops::LinearObsOper::IASI METOP-B::setTrajectory
+#- oops::LinearObsOper::IASI METOP-B::simulateObsAD
+#- oops::LinearObsOper::IASI METOP-C::setTrajectory
+#- oops::LinearObsOper::IASI METOP-C::simulateObsAD
+#- oops::LinearObsOper::ssmis_f17::simulateObsAD
+#- oops::LinearVariableChange::changeVarAD
+#- oops::LinearVariableChange::changeVarTL
+#- oops::ObsAuxControl::ObsAuxControl
+#- oops::ObsDataVector::print
+#- oops::ObsOperator::AIRS AQUA::simulateObs
+#- oops::ObsOperator::CRIS-FSR NOAA-20::simulateObs
+#- oops::ObsOperator::CRIS-FSR NPP::simulateObs
+#- oops::ObsOperator::IASI METOP-B::simulateObs
+#- oops::ObsOperator::IASI METOP-C::simulateObs
+- oops::ObsSpace::ObsSpace
+- oops::ObsSpace::save
+- oops::State::State
+#- oops::State::print
+#- oops::State::write
+- oops::UnstructuredInterpolator::apply
+- oops::UnstructuredInterpolator::applyAD
+#- oops::VariableChange::changeVar
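The 'bar attributes' block above feeds the makebars routine introduced in the diff that follows: each experiment is drawn as one set of horizontal bars, shifted vertically by offset = i*width so the runs sit side by side for every method. A minimal sketch of that layout idea, with made-up method names and timings:

    import numpy as np
    import matplotlib.pyplot as plt

    methods = ["oops::Covariance::SABER::multiply", "oops::ObsSpace::ObsSpace"]
    exp_times = {"Exp1": [120.0, 45.0], "Exp2": [95.0, 50.0]}  # illustrative seconds

    width = 0.35
    ind = np.arange(len(methods))
    fig, ax = plt.subplots()
    for i, (label, times) in enumerate(exp_times.items()):
        # Shift each experiment by i*width, as the driver code in the patch does.
        ax.barh(ind + i * width, times, width, label=label)
    ax.set(yticks=ind + width / 2, yticklabels=methods, xlabel="Runtime (s)")
    ax.legend()
    plt.show()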
diff --git a/utils/profiling/oops_app_profile.py b/utils/profiling/oops_app_profile.py
index 958fac5f1..4f7485a9a 100644
--- a/utils/profiling/oops_app_profile.py
+++ b/utils/profiling/oops_app_profile.py
@@ -1,28 +1,20 @@
+#!/usr/bin/env python3
+
 import argparse
 import yaml
 import matplotlib.pyplot as plt
 import re
+import numpy as np

-# Parse command-line arguments
-parser = argparse.ArgumentParser(description='Process profiling data from a YAML configuration file.')
-parser.add_argument('config', type=str, help='Path to the YAML configuration file')
-args = parser.parse_args()
+def read_timers(file_path):

-# Load the YAML configuration file
-with open(args.config, 'r') as yaml_file:
-    config = yaml.safe_load(yaml_file)
+    # Define a regex to extract parallel timing statistics
+    pattern = re.compile(r"OOPS_STATS\s+(.+?)\s+:\s+(\d+\.\d+)")

-# Extract the file path from the configuration
-file_path = config['oops log']
-methods = config['methods']
-
-# Define a regex to extract parallel timing statistics
-pattern = re.compile(r"OOPS_STATS\s+(.+?)\s+:\s+(\d+\.\d+)")
-
-# Read and parse the file
-runtimes = {}
-in_parallel_section = False
-with open(file_path, "r") as file:
+    # Read and parse the file
+    runtimes = {}
+    in_parallel_section = False
+    with open(file_path, "r") as file:
         for line in file:
             if "---------------------------------- Parallel Timing Statistics" in line:
                 if in_parallel_section:
@@ -37,9 +29,18 @@
                 key, runtime = match.groups()
                 runtimes[key.strip()] = float(runtime) / 1000  # Convert ms to seconds

-# Ensure there is data to plot
-if runtimes:
+    return runtimes
+
+def makepie(runtimes,methods):
+
+    # Ensure there is data to plot
+    if runtimes:
         # Sort by runtime in descending order
+#        if nosort==True:
+#            print ("not being sorted")
+#            sorted_runtimes = runtimes.items()
+#        else:
+#            sorted_runtimes = sorted(runtimes.items(), key=lambda item: item[1], reverse=True)
         sorted_runtimes = sorted(runtimes.items(), key=lambda item: item[1], reverse=True)

         # Calculate cumulative runtime and determine the cutoff for the top 95%
@@ -75,18 +76,114 @@
         # Prepare data for plotting
         labels, sizes = zip(*top_runtimes)

-    # Generate Pie Chart with labels on the side
+        # Set figure dimensions
         plt.figure(figsize=(15, 10))
+
+        # Generate Pie Chart with labels on the side
         wedges, texts, autotexts = plt.pie(sizes, autopct='%1.1f%%', startangle=140)
         for i, text in enumerate(autotexts):
             text.set_text(f'{sizes[i]:.2f}')
+            if labels[i] == "Other":
+                wedges[i].set_alpha(0.5)

         # Add a legend with the labels
         plt.legend(wedges, labels, title="Categories")
+        plt.axis('equal')  # Equal aspect ratio ensures that pie is drawn as a circle.

         plt.title("Parallel Runtime Distribution from OOPS Profiling Data", fontsize=16, fontweight='bold')
         plt.xlabel("Runtime (s)", fontsize=14)
-    plt.axis('equal')  # Equal aspect ratio ensures that pie is drawn as a circle.
-    plt.show()
+    else:
+        print("No timing data found in the Parallel Timing Statistics section.")
+
+def makebars(runtimes,methods,ax,width,offset,color,case):
+
+    # Ensure there is data to plot
+    if runtimes:
+        # Keep the timers in the order they appear in the log (no re-sorting)
+        sorted_runtimes = runtimes.items()
+
+        # Calculate the total runtime and accumulate the runtime of the selected methods
+        total_runtime = sum(runtime for _, runtime in sorted_runtimes)
+        cumulative_runtime = 0
+        top_runtimes = []
+        other_runtime = 0
+        # Convert sorted_runtimes to a dictionary
+        sorted_runtimes_dict = {key: runtime for key, runtime in sorted_runtimes}
+
+        # print the sorted_runtimes_dict one key/value pair per line
+        for key, value in sorted_runtimes_dict.items():
+            print(f"{key}: {value}")
+
+        total_runtime_value = sorted_runtimes_dict['util::Timers::Total']
+
+        for key, runtime in sorted_runtimes:
+            if key in methods:
+                print(f"---------- key: {key}, runtime: {runtime}")
+                top_runtimes.append((key, runtime))
+                cumulative_runtime += runtime
+
+        other_runtime = total_runtime_value - cumulative_runtime
+
+        print(f"Total runtime: {total_runtime_value}")
+        print(f"Top runtime: {cumulative_runtime}")
+        print(f"Other runtime: {other_runtime}")
+
+        # Add the "Other" category
+        if other_runtime > 0:
+            top_runtimes.append(("Other", other_runtime))
+
+        # Prepare data for plotting
+        labels, sizes = zip(*top_runtimes)
+
+        # Generate horizontal bar chart with labels on the side
+        ind = np.arange(len(labels))
+        bars = ax.barh(ind+offset,sizes,width,color=color,label=case+f': {total_runtime_value:.1f}s')
+
+        ax.set(yticks=ind+offset, yticklabels=labels, ylim=[2*width - 1, len(labels)])
+        ax.legend()
+        ax.set_title("Parallel Runtime Distribution from OOPS Profiling Data", fontsize=16, fontweight='bold')
+        ax.set_xlabel("Runtime (s)", fontsize=14)
+
+        # annotate bars with percentage times
+        for i, this in enumerate(top_runtimes):
+            p = 100 * this[1] / total_runtime_value
+            ax.text(this[1] + 0.005*total_runtime_value, i+offset, f'{p:.1f}%\n',
+                    color=color, fontweight='bold', fontsize=8, ha='left', va='top')
+    else:
+        print("No timing data found in the Parallel Timing Statistics section.")
+
+# Parse command-line arguments
+parser = argparse.ArgumentParser(description='Process profiling data from a YAML configuration file.')
+parser.add_argument('config', type=str, help='Path to the YAML configuration file')
+args = parser.parse_args()
+
+# Load the YAML configuration file
+with open(args.config, 'r') as yaml_file:
+    config = yaml.safe_load(yaml_file)
+
+# Extract the file path from the configuration
+file_path = config['oops log']
+methods = config['methods']
+plt_type = config['plot type']
+
+if plt_type == 'pie':
+    # make pie chart
+    for file in file_path:
+        runtimes = read_timers(file)
+        makepie(runtimes,methods)
+
 else:
-    print("No timing data found in the Parallel Timing Statistics section.")
+    # read relevant additional attributes
+    # make bar plots
+    colors = config['bar attributes']['colors']
+    labels = config['bar attributes']['labels']
+    width = config['bar attributes']['width']
+    fig, ax = plt.subplots(figsize=(12, 8), gridspec_kw={'width_ratios': [2], 'height_ratios': [1]})
+    for i, file in enumerate(file_path):
+        runtimes = read_timers(file)
+        offset = i*width
+        makebars(runtimes,methods,ax,width,offset,colors[i],labels[i])
+    plt.subplots_adjust(left=0.3)  # labels tend to be long
+
+plt.show()
+
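Each bar is annotated with its share of the total wall time reported by util::Timers::Total, not with its share of the plotted methods only; a quick numeric sketch with illustrative values:

    # A method that took 95 s in a run whose util::Timers::Total is 250 s.
    total_runtime_value = 250.0
    method_runtime = 95.0

    p = 100 * method_runtime / total_runtime_value
    print(f"{p:.1f}%")  # -> 38.0%, the figure printed next to the bar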
diff --git a/utils/profiling/profile.yaml b/utils/profiling/profile.yaml
index ae3eff704..dd68a49ed 100644
--- a/utils/profiling/profile.yaml
+++ b/utils/profiling/profile.yaml
@@ -1,4 +1,5 @@
-oops log: 'oops_stats.txt'
+oops log: ['oops_stats.txt']
+plot type: pie
 methods:
 - oops::Covariance::SABER::multiply
 - oops::State::State
@@ -32,4 +33,4 @@ methods:
 #- oops::GetValues::fillGeoVaLsTL
 #- oops::GetValues::fillGeoVaLsAD
 #- oops::State::toFieldSet
 #- oops::Increment::fromFieldSet
-#
\ No newline at end of file
+#
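With the three patches applied, profile.yaml drives the single-log pie chart and cmp2exp.yaml the two-experiment bar comparison. The driver assumes the keys it needs are present ('oops log', 'methods', 'plot type', and 'bar attributes' for bar plots); a small validation sketch along those lines, which is not part of the patches:

    import sys
    import yaml

    def check_config(path):
        """Warn about missing top-level keys before the plotting code dereferences them."""
        with open(path, "r") as f:
            config = yaml.safe_load(f)
        required = ["oops log", "methods", "plot type"]
        if config.get("plot type") == "bars":
            required.append("bar attributes")
        missing = [key for key in required if key not in config]
        if missing:
            sys.exit(f"missing keys in {path}: {missing}")
        return config

    if __name__ == "__main__":
        check_config(sys.argv[1])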