Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
189 changes: 189 additions & 0 deletions analysis/bdas/1-run-analysis.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,189 @@
#!/usr/bin/env python3

import argparse
import os
import sys
import re

import matplotlib.pylab as plt
import seaborn as sns

# Resolve the repository layout relative to this file:
#   here          -> analysis/bdas (directory of this script)
#   analysis_root -> analysis
#   root          -> repository root
here = os.path.dirname(os.path.abspath(__file__))
analysis_root = os.path.dirname(here)
root = os.path.dirname(analysis_root)
# Make the shared performance_study helper module importable before importing it
sys.path.insert(0, analysis_root)

import performance_study as ps

# Consistent plot styling for all figures produced below
sns.set_theme(style="whitegrid", palette="muted")

# These are files I found erroneous - no result, or incomplete result
# Details included with each, and more exploration is likely needed to quantify
# error types
# NOTE(review): with an empty list this builds the regex "()", which matches
# every string — confirm intent before using error_regex as a filter.
errors = []
error_regex = "(%s)" % "|".join(errors)


def get_parser():
    """
    Build the command line parser for the bdas analysis script.

    Options:
        --root: root directory with experiments (default: <repo>/experiments)
        --non-anon: generate non-anonymized output
        --out: directory to save parsed results (default: <script dir>/data)
    """
    # Defaults are anchored to the repository layout computed at import time
    default_experiments = os.path.join(root, "experiments")
    default_data = os.path.join(here, "data")

    parser = argparse.ArgumentParser(
        description="Run analysis",
        formatter_class=argparse.RawTextHelpFormatter,
    )
    parser.add_argument(
        "--root",
        default=default_experiments,
        help="root directory with experiments",
    )
    parser.add_argument(
        "--non-anon",
        action="store_true",
        default=False,
        help="Generate non-anon",
    )
    parser.add_argument(
        "--out",
        default=default_data,
        help="directory to save parsed results",
    )
    return parser


def main():
    """
    Find application result files to parse.

    Resolves input/output directories from the command line, ensures the
    output directory exists, then parses results and generates plots.
    """
    args, _ = get_parser().parse_known_args()

    # Normalize paths for input experiments and output data/images
    indir = os.path.abspath(args.root)
    outdir = os.path.abspath(args.out)

    # We absolutely want on premises results here
    if not os.path.exists(outdir):
        os.makedirs(outdir)

    # Find input files (skip anything with test)
    files = ps.find_inputs(indir, "bdas")
    if not files:
        raise ValueError(f"There are no input files in {indir}")

    # Parse raw data to file, then plot from the intermediate frame
    df = parse_data(indir, outdir, files)
    plot_results(df, outdir, args.non_anon)



def parse_data(indir, outdir, files):
    """
    Parse filepaths for environment, etc., and results files for data.

    Parameters:
        indir: root directory the experiment files were discovered under
        outdir: directory where the csv/json intermediates are written
        files: list of result file paths to parse

    Returns:
        The populated results data frame (also saved to bdas-results.csv).
    """
    # metrics here will be figures of merit, and seconds runtime
    p = ps.ProblemSizeParser("bdas")

    # Accumulate flux jobs across ALL files. Previously only the loop
    # variable `jobs` from the last parsed file was written to json (and it
    # was undefined if every file was skipped).
    all_jobs = {}

    # It's important to just parse raw data once, and then use intermediate
    for filename in files:
        exp = ps.ExperimentNameParser(filename, indir)

        # Skip size 2: testing
        if exp.size == 2:
            continue

        # kmeans, princcomp, or svm
        app = os.path.basename(filename).split('-')[-1].replace('.r.out', '')

        # Set the parsing context for the result data frame
        p.set_context(exp.cloud, exp.env, exp.env_type, exp.size)

        # Sanity check the files we found
        print(filename)
        exp.show()

        item = ps.read_file(filename)
        jobs = ps.parse_flux_jobs(item)
        all_jobs.update(jobs)
        for job, metadata in jobs.items():
            print(metadata)
            # The final log line holds whitespace-separated min/mean/max values
            minimum, mean, maximum = [x for x in metadata['log'].split('\n')[-1].split(' ') if x.strip()]
            p.add_result("duration", metadata['duration'], app)
            p.add_result("minimum", minimum, app)
            p.add_result("mean", mean, app)
            p.add_result("maximum", maximum, app)

    print("Done parsing bdas results!")

    # Save stuff to file first
    p.df.to_csv(os.path.join(outdir, "bdas-results.csv"))
    ps.write_json(all_jobs, os.path.join(outdir, "flux-jobs-and-events.json"))
    return p.df

def plot_results(df, outdir, non_anon=False):
    """
    Plot analysis results

    For each metric in the parsed frame, draws a bar plot of value by nodes
    (hue = problem_size) and saves svg/png copies under <outdir>/img.

    Parameters:
        df: results frame with experiment, env_type, metric, nodes, value,
            and problem_size columns (as produced by parse_data)
        outdir: output directory; an img/ subdirectory is created beneath it
        non_anon: accepted by the interface but not used in this function
    """
    # Let's get some shoes! Err, plots.
    # Make an image outdir
    img_outdir = os.path.join(outdir, "img")
    if not os.path.exists(img_outdir):
        os.makedirs(img_outdir)

    # We are going to put the plots together, and the colors need to match!
    # NOTE(review): cloud_colors is only referenced by the commented-out
    # palette= argument below, so it currently has no effect on the plots.
    cloud_colors = {}
    for cloud in df.experiment.unique():
        cloud_colors[cloud] = ps.match_color(cloud)

    # Within a setup, compare between experiments for GPU and cpu
    # NOTE(review): frames[metric] is reassigned on every env_type iteration,
    # so only the subset from the LAST env_type survives per metric — confirm
    # this is intended (e.g. if only one env_type exists it is harmless).
    frames = {}
    for env in df.env_type.unique():
        subset = df[df.env_type == env]

        # Make a plot for seconds runtime, and each FOM set.
        # We can look at the metric across sizes, colored by experiment
        for metric in subset.metric.unique():
            metric_df = subset[subset.metric == metric]
            frames[metric] = {'cpu': metric_df}

    for metric, data_frames in frames.items():
        # Wide bar-plot axis plus a narrow axis reserved for the legend
        fig = plt.figure(figsize=(9, 3.3))
        gs = plt.GridSpec(1, 2, width_ratios=[3, 1])
        axes = []
        axes.append(fig.add_subplot(gs[0, 0]))
        axes.append(fig.add_subplot(gs[0, 1]))

        sns.set_style("whitegrid")
        sns.barplot(
            data_frames["cpu"],
            ax=axes[0],
            x="nodes",
            y="value",
            hue="problem_size",
            err_kws={"color": "darkred"},
            # palette=cloud_colors,
            order=[4, 8, 16, 32, 64],
        )
        # Derive a display title from the metric name, e.g. "foo_bar" -> "Foo Bar"
        title = " ".join([x.capitalize() for x in metric.split("_")])
        axes[0].set_title(f"BDAS {title} (CPU)", fontsize=14)
        axes[0].set_ylabel("Seconds", fontsize=14)
        axes[0].set_xlabel("Nodes", fontsize=14)
        # Move the legend off the bar plot onto the dedicated right-hand axis,
        # shortening labels to their first two "/"-separated components
        handles, labels = axes[0].get_legend_handles_labels()
        labels = ["/".join(x.split("/")[0:2]) for x in labels]
        axes[1].legend(
            handles, labels, loc="center left", bbox_to_anchor=(-0.1, 0.5), frameon=False
        )
        # Strip the auto-generated legend from the bar plot axis only
        for ax in axes[0:1]:
            ax.get_legend().remove()
        axes[1].axis("off")

        plt.tight_layout()
        plt.savefig(os.path.join(img_outdir, f"bdas-{metric}-cpu.svg"))
        plt.savefig(os.path.join(img_outdir, f"bdas-{metric}-cpu.png"))
        plt.clf()

        # Print the total number of data points
        print(f'Total number of CPU datum: {data_frames["cpu"].shape[0]}')


# Run the full parse-and-plot pipeline when invoked as a script
if __name__ == "__main__":
    main()
Loading