Merge pull request #49088 from gartung/gartung-PerTools-AllocMonitorCircles

cmsbuild · web-flow · commit 1903dbf6533f · 2025-10-09T22:58:27.000+02:00
PerfTools/AllocMonitor: Update edmModuleAllocJsonToCircles.py to add "event setup" transition for ESProducers
diff --git a/PerfTools/AllocMonitor/scripts/edmModuleAllocJsonToCircles.py b/PerfTools/AllocMonitor/scripts/edmModuleAllocJsonToCircles.py
@@ -1,5 +1,15 @@
 #!/usr/bin/env python3
 import json
+import sys
+from collections import namedtuple
+
+# Constants
+BYTES_TO_KB = 1024
+EVENTSETUP_TRANSITION = "event setup"
+
+# Named tuple for unique module identification
+UniqueKey = namedtuple('UniqueKey', ['moduleLabel', 'moduleType', 'recordName'])
+
 transitionTypes = [
     "construction",
     "begin job",
@@ -9,15 +19,62 @@
     "global begin luminosity block",
     "stream begin luminosity block",
     "event",
+    EVENTSETUP_TRANSITION,
 ]
 allocTypes = ["added", "nAlloc", "nDealloc", "maxTemp", "max1Alloc"]
 
 def processModuleTransition(moduleLabel, moduleType, moduleInfo, transitionType, moduleTransition):
-        moduleTransition[moduleLabel] = {"cpptype": moduleType, "allocs": []}
-        for entry in moduleInfo:
-            if entry["transition"] == transitionType:
-                moduleTransition[moduleLabel]["allocs"].append(entry.get("alloc",{}))
-        moduleTransition[moduleLabel]["nTransitions"] = len(moduleTransition[moduleLabel]["allocs"])
+    """
+    Processes module transitions for a given transition type.
+
+    The expected schema for each 'alloc' dictionary is:
+        {
+            "added": int,        # Bytes added during transition
+            "nAlloc": int,       # Number of allocations
+            "nDealloc": int,     # Number of deallocations
+            "maxTemp": int,      # Maximum temporary memory (bytes)
+            "max1Alloc": int     # Largest single allocation (bytes)
+        }
+    Any field missing from an 'alloc' dictionary is treated as 0 when formatToCircles sums the values.
+
+    Note: Entries that carry a record name are skipped here; they are counted only under the "event setup" transition.
+    """
+    moduleKey = UniqueKey(moduleLabel, moduleType, "")
+    moduleTransition[moduleKey] = {"cpptype": moduleType, "allocs": []}
+    for entry in moduleInfo:
+        # Only process entries that match the transition type AND don't have record names
+        # (entries with record names are EventSetup only)
+        if (entry.get("transition", None) == transitionType and
+            not ("record" in entry and "name" in entry["record"])):
+            moduleTransition[moduleKey]["allocs"].append(entry.get("alloc", {}))
+    moduleTransition[moduleKey]["nTransitions"] = len(moduleTransition[moduleKey]["allocs"])
+
+def processESModuleTransition(moduleLabel, moduleType, moduleInfo, moduleTransition):
+    """Process EventSetup transitions - entries with record names
+
+    Creates unique entries for each module+type+record combination.
+    """
+    # Group allocations by record name
+    recordAllocations = {}
+    for entry in moduleInfo:
+        # EventSetup entries are those with a "record" field containing "name"
+        if "record" in entry and "name" in entry["record"]:
+            recordName = entry["record"]["name"]
+            if recordName not in recordAllocations:
+                recordAllocations[recordName] = []
+            recordAllocations[recordName].append(entry.get("alloc", {}))
+
+    # Create separate entries for each record
+    for recordName, allocs in recordAllocations.items():
+        # Create unique key: module + type + record
+        uniqueKey = UniqueKey(moduleLabel, moduleType, recordName)
+        moduleTransition[uniqueKey] = {
+            "cpptype": moduleType,
+            "allocs": allocs,
+            "nTransitions": len(allocs),
+            "moduleLabel": moduleLabel,
+            "recordName": recordName
+        }
 
 def formatToCircles(moduleTransitions):
     modules_dict = {}
@@ -62,67 +119,128 @@ def formatToCircles(moduleTransitions):
         ]
     # The circles code uses the "events" field to normalize the values between files with different number of events
     # Here we set it to 1 for the total events because the total is already normalized per transition
-        doc["total"]["events"] = 1
-        doc["total"]["label"] = "Job"
-        doc["total"]["type"] = "Job"
+    doc["total"]["events"] = 1
+    doc["total"]["label"] = "Job"
+    doc["total"]["type"] = "Job"
+    # Initialize totals for all transition types and allocation types
+    for transType in transitionTypes:
         for allocType in allocTypes:
-            doc["total"][f"{allocType} {transitionType}"] = 0
+            doc["total"][f"{allocType} {transType}"] = 0
 
+    # First pass: collect all unique module keys across all transitions
+    all_module_keys = set()
     for transitionType, moduleTransition in moduleTransitions.items():
-        for label, info in moduleTransition.items():
+        for uniqueKey in moduleTransition.keys():
+            all_module_keys.add(uniqueKey)
+
+    # Initialize all modules with default values for all transitions
+    for displayKey in all_module_keys:
+        if displayKey not in modules_dict:
+            # UniqueKey namedtuple provides direct access to fields
+            modules_dict[displayKey] = {
+                "label": displayKey.moduleLabel,
+                "type": displayKey.moduleType,
+                "record": displayKey.recordName
+            }
+
+            # Initialize all transition metrics to zero
+            for transType in transitionTypes:
+                for allocType in allocTypes:
+                    modules_dict[displayKey][f"{allocType} {transType}"] = 0.0
+
+    # Second pass: populate actual values
+    for transitionType, moduleTransition in moduleTransitions.items():
+        for uniqueKey, info in moduleTransition.items():
             allocs = info.get("allocs", [])
-            if not label in modules_dict:
-                modules_dict[label] = {
-                    "label": info.get("label", label),
-                    "type": info.get("cpptype", "unknown")
-                }
-            added = 0
-            nAlloc = 0
-            nDealloc = 0
-            maxTemp = 0
-            max1Alloc = 0
-            for alloc in allocs:
-                added += alloc.get("added", 0)
-                nAlloc += alloc.get("nAlloc", 0)
-                nDealloc += alloc.get("nDealloc", 0)
-                maxTemp += alloc.get("maxTemp", 0)
-                max1Alloc += alloc.get("max1Alloc", 0)
-            ntransitions = moduleTransitions[transitionType][label]["nTransitions"]
-            if ntransitions > 0:
-                modules_dict[label][f"nAlloc {transitionType}"] = nAlloc/ntransitions
-                modules_dict[label][f"added {transitionType}"] = (added/ntransitions)/1024
-                modules_dict[label][f"maxTemp {transitionType}"] = (maxTemp/ntransitions)/1024
-                modules_dict[label][f"nDealloc {transitionType}"] = nDealloc/ntransitions
-                modules_dict[label][f"max1Alloc {transitionType}"] = (max1Alloc/ntransitions)/1024
-            else:
-                modules_dict[label][f"nAlloc {transitionType}"] = nAlloc
-                modules_dict[label][f"added {transitionType}"] = (added)/1024
-                modules_dict[label][f"maxTemp {transitionType}"] = (maxTemp)/1024
-                modules_dict[label][f"nDealloc {transitionType}"] = nDealloc
-                modules_dict[label][f"max1Alloc {transitionType}"] = max1Alloc/1024
-            doc["total"][f"nAlloc {transitionType}"] += modules_dict[label][f"nAlloc {transitionType}"]
-            doc["total"][f"nDealloc {transitionType}"] += modules_dict[label][f"nDealloc {transitionType}"]
-            doc["total"][f"maxTemp {transitionType}"] += modules_dict[label][f"maxTemp {transitionType}"]
-            doc["total"][f"added {transitionType}"] += modules_dict[label][f"added {transitionType}"]
-            doc["total"][f"max1Alloc {transitionType}"] += modules_dict[label][f"max1Alloc {transitionType}"]
 
+            # Defensive guard: the first pass registers every key in modules_dict, so this check always passes
+            if uniqueKey in modules_dict:
+                added = 0
+                nAlloc = 0
+                nDealloc = 0
+                maxTemp = 0
+                max1Alloc = 0
+                for alloc in allocs:
+                    added += alloc.get("added", 0)
+                    nAlloc += alloc.get("nAlloc", 0)
+                    nDealloc += alloc.get("nDealloc", 0)
+                    maxTemp += alloc.get("maxTemp", 0)
+                    max1Alloc += alloc.get("max1Alloc", 0)
+                ntransitions = moduleTransitions[transitionType][uniqueKey].get("nTransitions", 0)
+                # Normalize by number of transitions if > 0, otherwise use raw values
+                divisor = max(ntransitions, 1)  # Avoid division by zero
+
+                modules_dict[uniqueKey][f"nAlloc {transitionType}"] = nAlloc / divisor
+                modules_dict[uniqueKey][f"nDealloc {transitionType}"] = nDealloc / divisor
+                modules_dict[uniqueKey][f"added {transitionType}"] = (added / divisor) / BYTES_TO_KB
+                modules_dict[uniqueKey][f"maxTemp {transitionType}"] = (maxTemp / divisor) / BYTES_TO_KB
+                modules_dict[uniqueKey][f"max1Alloc {transitionType}"] = (max1Alloc / divisor) / BYTES_TO_KB
+                doc["total"][f"nAlloc {transitionType}"] += modules_dict[uniqueKey][f"nAlloc {transitionType}"]
+                doc["total"][f"nDealloc {transitionType}"] += modules_dict[uniqueKey][f"nDealloc {transitionType}"]
+                doc["total"][f"maxTemp {transitionType}"] += modules_dict[uniqueKey][f"maxTemp {transitionType}"]
+                doc["total"][f"added {transitionType}"] += modules_dict[uniqueKey][f"added {transitionType}"]
+                doc["total"][f"max1Alloc {transitionType}"] += modules_dict[uniqueKey][f"max1Alloc {transitionType}"]
     for key in sorted(modules_dict.keys()):
         module = modules_dict[key]
-        module["events"] = moduleTransitions['event'][key].get("nTransitions")
+ 
+        # Check if this is an empty entry (record="" and all allocations are zero)
+        if module["record"] == "":
+            # Check if all allocation metrics are zero across all transition types
+            hasNonZeroAllocations = False
+            for transType in transitionTypes:
+                for allocType in allocTypes:
+                    if module.get(f"{allocType} {transType}", 0) != 0:
+                        hasNonZeroAllocations = True
+                        break
+                if hasNonZeroAllocations:
+                    break
+
+            # Skip this entry if no allocations and empty record
+            if not hasNonZeroAllocations:
+                continue
+
+        # Use the module label from the UniqueKey namedtuple for event count lookup
+        moduleLabel = key.moduleLabel
+        # Look for the corresponding regular module key for event transitions
+        eventKey = UniqueKey(moduleLabel, key.moduleType, "")
+        eventCount = moduleTransitions['event'].get(eventKey, {}).get("nTransitions", 0)
+        # Set events to 1 if it's 0 to prevent NaNs in Circles visualization
+        module["events"] = max(eventCount, 1)
         doc["modules"].append(module)
 
     return doc
 
 def main(args):
-    import sys
-    doc = json.load(args.filename)
+    try:
+        doc = json.load(args.filename)
+    except json.JSONDecodeError as e:
+        print(f"Error parsing JSON: {e}", file=sys.stderr)
+        sys.exit(1)
+    except Exception as e:
+        print(f"Error reading file: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    # Validate required fields
+    if 'cpptypes' not in doc:
+        print("Error: Missing 'cpptypes' field in input JSON", file=sys.stderr)
+        sys.exit(1)
+    if 'modules' not in doc:
+        print("Error: Missing 'modules' field in input JSON", file=sys.stderr)
+        sys.exit(1)
+
     moduleTypes = doc['cpptypes']
     moduleTransitions = dict()
     for transition in transitionTypes:
         moduleTransition = dict()
-        processModuleTransition("source", "PoolSource", doc["source"], transition, moduleTransition)
-        for moduleLabel, moduleInfo in doc["modules"].items():
-            processModuleTransition(moduleLabel, moduleTypes[moduleLabel], moduleInfo, transition, moduleTransition)
+        if transition == EVENTSETUP_TRANSITION:
+            # EventSetup transitions are handled differently - look for records with names
+            for moduleLabel, moduleInfo in doc["modules"].items():
+                processESModuleTransition(moduleLabel, moduleTypes[moduleLabel], moduleInfo, moduleTransition)
+        else:
+            # Regular transition processing
+            processModuleTransition("source", "PoolSource", doc["source"], transition, moduleTransition)
+            for moduleLabel, moduleInfo in doc["modules"].items():
+                processModuleTransition(moduleLabel, moduleTypes[moduleLabel], moduleInfo, transition, moduleTransition)
         moduleTransitions[transition] = moduleTransition
 
     json.dump(formatToCircles(moduleTransitions), sys.stdout, indent=2)