Add helpers for mpiP

Jose Gracia 2023-07-26 17:24:42 +02:00
parent 1b6199fd9d
commit d201363569
3 changed files with 249 additions and 1 deletion


@@ -3,4 +3,6 @@
Collection of private utilities and scripts for Hawk.
- monitoring: scripts related to power monitoring
- performance: scripts, configs, etc. related to performance tools
- this can be relocated into a `/opt/hlrs/non-spack/revXX` directory


@@ -0,0 +1,237 @@
#!/usr/bin/env python3
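"""Compute POP-style parallel efficiency and scalability metrics from one or
more mpiP report files and print them as CSV and as a plain-text table."""
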
import sys
import re
from operator import itemgetter
import logging
logging.basicConfig(stream=sys.stderr, level=logging.ERROR)
def get_Nranks(fn):
    import shlex
    import subprocess
    # mpiP prints one "@ MPI Task Assignment" line per rank; count them
    cmd = "grep '^@ MPI Task Assignment' %s | sed -n '$='" % shlex.quote(fn)
    result = subprocess.run(cmd, shell=True, stdout=subprocess.PIPE)
    try:
        nranks = int(result.stdout)
    except ValueError:
        logging.info("Cannot infer nranks from MPI Task Assignments.")
        nranks = None
    return {"ranks": nranks}

def get_times(fn):
    logging.debug("Getting times from %s" % fn)
    start_time_stats = re.compile(r"^@-+ Task Time Statistics")
    separator = re.compile(r"^-")
    header = re.compile(r".*AppTime")
    maxline = re.compile(r"^Max ")
    meanline = re.compile(r"^Mean\s+([\.\d]+)\s+([\.\d]+)")
    minline = re.compile(r"^Min\s+([\.\d]+)\s+([\.\d]+)")
    stdline = re.compile(r"^Stddev ")
    aggrline = re.compile(r"^Aggregate\s+([\.\d]+)\s+([\.\d]+)")
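    # The patterns above assume a statistics block shaped roughly like the
    # sketch below (illustrative, reconstructed from the regexes rather than
    # copied from a real mpiP report):
    #
    #   @--- Task Time Statistics (seconds) ---
    #   ---------------------------------------
    #              AppTime      MPITime
    #   Max          12.42         3.81
    #   Mean         12.40         3.10
    #   Min          12.38         2.95
    #   Stddev        0.02         0.31
    #   Aggregate    99.20        24.80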
    times = dict()
    with open(fn) as stream:
        # find start of time statistics
        line = stream.readline()
        while line:
            if start_time_stats.match(line):
                break
            line = stream.readline()
        logging.debug("Done start")
        # expect separator
        line = stream.readline()
        if not separator.match(line):
            logging.error("Failed to parse expected separator.")
            return times
        logging.debug("Done separator")
        # expect header
        line = stream.readline()
        if not header.match(line):
            logging.error("Failed to parse expected header.")
            return times
        logging.debug("Done header")
        # expect Max line
        line = stream.readline()
        if not maxline.match(line):
            logging.error("Failed to parse expected Max line.")
            return times
        # expect and parse Mean line
        line = stream.readline()
        m = meanline.match(line)
        if not m:
            logging.error("Failed to parse expected Mean line.")
            return times
        avg_app = float(m.group(1))
        avg_mpi = float(m.group(2))
        # expect and parse Min line
        line = stream.readline()
        m = minline.match(line)
        if not m:
            logging.error("Failed to parse expected Min line.")
            return times
        min_mpi = float(m.group(2))
        # expect Stddev line
        line = stream.readline()
        if not stdline.match(line):
            logging.error("Failed to parse expected Stddev line.")
            return times
        # expect and parse Aggregate line
        line = stream.readline()
        m = aggrline.match(line)
        if not m:
            logging.error("Failed to parse expected Aggregate line.")
            return times
        aggr_app = float(m.group(1))
        logging.debug("Done times")
    elapsed = avg_app
    times["elapsed"] = elapsed
    # useful (non-MPI) time per rank; the rank with the least MPI time
    # has the most useful time
    times["avg useful"] = elapsed - avg_mpi
    times["max useful"] = elapsed - min_mpi
    # fallback rank count: aggregate AppTime divided by mean AppTime
    times["ranks_alt"] = round(aggr_app/avg_app)
    return times

def efficiencies(fn):
    metrics = dict()
    metrics.update(get_Nranks(fn))
    metrics.update(get_times(fn))
    if metrics["ranks"] is None:
        metrics["ranks"] = metrics["ranks_alt"]
metrics["PE"] = metrics["avg useful"]/metrics["elapsed"]
metrics["LB"] = metrics["avg useful"]/metrics["max useful"]
metrics["CE"] = metrics["max useful"]/metrics["elapsed"]
return metrics
def scalabilities(metrics, strong=None):
    if strong is None:
        # Try to determine scaling type. For now assume weak scaling.
        strong = False
    # the run with the fewest ranks (metrics is sorted) serves as reference
    ref = metrics[0]
    nranks_ref = ref["ranks"]
    useful_ref = ref["avg useful"]
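    # Computation scalability: ratio of the reference run's useful time to
    # this run's useful time; under strong scaling the total work is fixed,
    # so the ratio is additionally weighted by nranks_ref/nranks.
    # Global efficiency combines it with parallel efficiency: GE = PE * CScal.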
    for m in metrics:
        scal = useful_ref/m["avg useful"]
        if strong:
            scal *= nranks_ref/m["ranks"]
        m["CScal"] = scal
        m["GE"] = m["PE"]*scal
    return metrics

def dump(metrics, stream=sys.stdout, sep=",", keys=None):
    if not keys:
        keys = [
            "ranks",
            "elapsed", "avg useful", "max useful",
            "GE", "PE", "LB", "CE", "CScal"
        ]
    header = "# " + sep.join(keys) + "\n"
    stream.write(header)
    for m in metrics:
        line = sep.join([str(m[key]) for key in keys]) + "\n"
        stream.write(line)

def pretty_print(metrics, stream=sys.stdout):
    descriptions = {
        "GE": " GE ",
        "PE": " PE ",
        "LB": " LB ",
        "CE": " CE ",
        "TrE": " TrE ",
        "SerE": " SerE ",
        "CScal": " CScal ",
        "elapsed": " Elapsed time ",
        "avg useful": " Average useful ",
        "max useful": " Max useful "
    }
    eff_keys = ["GE", "PE", "LB", "CE"]
    scal_keys = ["CScal"]
    other_keys = ["elapsed", "avg useful", "max useful"]
    separator = "|"
    # pad row labels to the widest description so the columns line up
    width_desc = max(len(d) for d in descriptions.values())
    width_col = 7
    width_separator = len(separator)
    ncols = len(metrics)
    skip = "-" * (width_desc + (width_separator+width_col)*ncols + width_separator)
    table = ""
    table += skip + "\n"
    table += " " * width_desc + separator
    for col in metrics:
        table += f'{col["ranks"]:^{width_col}d}' + separator
    table += "\n"
    table += skip + "\n"
    for key in eff_keys:
        line = f'{descriptions[key]:<{width_desc}}' + separator
        for col in metrics:
            line += f'{col[key]:^{width_col}.2f}' + separator
        table += line + "\n"
    for key in scal_keys:
        line = f'{descriptions[key]:<{width_desc}}' + separator
        for col in metrics:
            line += f'{col[key]:^{width_col}.2f}' + separator
        table += line + "\n"
    table += skip + "\n"
    for key in other_keys:
        line = f'{descriptions[key]:<{width_desc}}' + separator
        for col in metrics:
            line += f'{col[key]:^{width_col}.2g}' + separator
        table += line + "\n"
    table += skip + "\n"
    stream.write(table)

def main():
    filenames = sys.argv[1:]
    metrics = list()
    # compute parallel efficiencies for each input
    for fn in filenames:
        # report progress on stderr; stdout carries the output of dump()
        print("Processing file %s" % fn, file=sys.stderr)
        metrics.append(efficiencies(fn))
    # sort metrics by ranks
    metrics.sort(key=itemgetter('ranks'))
    # compute scalabilities
    metrics = scalabilities(metrics)
    dump(metrics)
    pretty_print(metrics)

if __name__ == "__main__":
    main()


@@ -0,0 +1,9 @@
#!/bin/bash
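#
# Usage: prepend this wrapper to the application command line under the MPI
# launcher, e.g. (launcher, rank count, and wrapper path are illustrative):
#   mpirun -np 64 ./mpip_wrapper.sh ./my_app args...
# mpiP options can be overridden via the MPIP environment variable, e.g.:
#   MPIP="-k 2 -c -d" mpirun -np 64 ./mpip_wrapper.sh ./my_app args...
#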
# default mpiP config
DEFAULT_MPIP="-c -d"
# set mpiP config to default if not provided by user
MPIP=${MPIP:-$DEFAULT_MPIP}
export MPIP
# preload the mpiP profiling library and run the user's command;
# quote "$@" to preserve argument word boundaries
exec env LD_PRELOAD=libmpiP.so "$@"