# MIT License
#
# Copyright (c) 2024-2025 Advanced Micro Devices, Inc.
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
# THE SOFTWARE.

25+
2626import os
2727import sys
2828import csv
29- import json
3029import subprocess
3130import pytest
3231
def node_exists(name, data, min_len=1):
    """Assert that *data* has a non-None entry *name*; sized values need >= *min_len* items."""
    assert name in data, f"missing key: {name}"
    value = data[name]
    assert value is not None, f"key is None: {name}"
    # Only length-check values that actually support len() (lists, dicts, strings, ...).
    if hasattr(value, "__len__"):
        assert len(value) >= min_len, f"key '{name}' too small"
3832
def run_rocpd_convert(db_path, out_dir):
    """Run `rocpd convert` to export the database at *db_path* as CSV files into *out_dir*."""
    os.makedirs(out_dir, exist_ok=True)
    cmd = [
        sys.executable, "-m", "rocpd", "convert",
        "-i", db_path,
        "--output-format", "csv",
        "-d", out_dir,
    ]
    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
    assert proc.returncode == 0, f"rocpd convert failed\ncmd={' '.join(cmd)}\nstdout={proc.stdout}\nstderr={proc.stderr}"
4439
40+
def find_kernel_trace_csv(out_dir):
    """Return the path of the first file in *out_dir* ending in kernel_trace.csv (fail if none)."""
    candidates = (name for name in os.listdir(out_dir) if name.endswith("kernel_trace.csv"))
    found = next(candidates, None)
    assert found is not None, f"kernel trace CSV not found in {out_dir}"
    return os.path.join(out_dir, found)
5047
48+
def load_csv_rows(path):
    """Read the CSV at *path* and return its data rows as a non-empty list of dicts."""
    assert os.path.isfile(path), f"missing CSV: {path}"
    with open(path, newline="") as handle:
        rows = [dict(record) for record in csv.DictReader(handle)]
    assert len(rows) > 0, f"empty CSV: {path}"
    return rows
5857
58+
def extract_json_kernel_records(json_root):
    """Return the non-empty kernel dispatch record list from a rocprofiler JSON document."""
    assert "rocprofiler-sdk-tool" in json_root, "missing rocprofiler-sdk-tool in JSON"
    tool_node = json_root["rocprofiler-sdk-tool"]
    # The tool section may be wrapped in a single-element list; unwrap it.
    if isinstance(tool_node, list) and len(tool_node) > 0:
        tool_node = tool_node[0]
    assert "buffer_records" in tool_node, "missing buffer_records in JSON"
    buffers = tool_node["buffer_records"]

    # Accept any of the known key names for the dispatch record list.
    for candidate in ("kernel_dispatch", "kernel_trace", "kernel_dispatch_trace"):
        entries = buffers.get(candidate)
        if isinstance(entries, list) and len(entries) > 0:
            return entries
    assert False, f"no kernel dispatch records found in JSON buffer_records keys={list(buffers.keys())}"
7072
def build_json_duration_map(records):
    """Build a map of str(dispatch_id) -> (start, end, duration) from JSON kernel records."""
    duration_map = {}
    for record in records:
        # Prefer the dispatch_id carried inside dispatch_info.
        info = record.get("dispatch_info", {})
        key = info.get("dispatch_id") if isinstance(info, dict) else None

        if key is None:
            # Fall back to the correlation id (its "internal" field when it is a dict).
            corr = record.get("correlation_id", {})
            key = corr.get("internal", 0) if isinstance(corr, dict) else corr

        # Timestamps must be present, positive, and properly ordered.
        begin_ts = record.get("start_timestamp")
        end_ts = record.get("end_timestamp")
        assert begin_ts is not None and end_ts is not None, f"missing timestamps in JSON record: {record}"

        begin_ts, end_ts = int(begin_ts), int(end_ts)
        assert begin_ts > 0 and end_ts > 0, f"invalid timestamps start={begin_ts} end={end_ts}"
        assert end_ts >= begin_ts, f"end before start: start={begin_ts} end={end_ts}"

        duration_map[str(key)] = (begin_ts, end_ts, end_ts - begin_ts)

    assert len(duration_map) > 0, "no kernel records extracted from JSON"
    return duration_map
91105
106+
def test_rocpd_kernel_trace_duration(json_data, db_path, tmp_path):
    """
    Test that rocpd CSV output contains Duration column and values match JSON.

    Test strategy:
    1. Generate JSON and rocpd output from SAME execution (using ROCPROF_OUTPUT_FORMAT env var)
    2. Use rocpd to convert database to CSV
    3. Compare CSV Duration with JSON-derived duration

    Since JSON and rocpd come from the same execution, timestamps should be IDENTICAL.
    We expect ZERO tolerance for differences.

    Validates:
    - Duration column exists in CSV
    - Duration values EXACTLY match between JSON and CSV (zero tolerance)
    - Duration correctly calculated as End - Start
    - Start and End timestamps also match exactly
    """
    # NOTE(review): json_data and db_path are presumably fixtures from a conftest.py not
    # visible here; tmp_path is the pytest built-in temporary directory fixture.

    # Convert rocpd DB to CSV
    out_dir = tmp_path / "rocpd_csv"
    run_rocpd_convert(db_path, str(out_dir))
    csv_path = find_kernel_trace_csv(str(out_dir))
    csv_rows = load_csv_rows(csv_path)

    # Verify Duration column exists
    assert "Duration" in csv_rows[0], f"missing 'Duration' column; columns={list(csv_rows[0].keys())}"

    # Extract JSON data
    json_records = extract_json_kernel_records(json_data)
    json_map = build_json_duration_map(json_records)

    # Track statistics
    matched_count = 0
    total_count = len(csv_rows)
    mismatches = []

    for csv_row in csv_rows:
        # Get CSV values
        csv_start = int(csv_row["Start_Timestamp"])
        csv_end = int(csv_row["End_Timestamp"])
        csv_dur = int(csv_row["Duration"])

        # Validate CSV internal consistency
        assert csv_start > 0 and csv_end > 0, f"invalid CSV timestamps: start={csv_start} end={csv_end}"
        assert csv_end >= csv_start, f"CSV end before start: {csv_end} < {csv_start}"
        assert csv_dur >= 0, f"negative CSV duration: {csv_dur}"
        assert csv_dur == (csv_end - csv_start), f"CSV duration mismatch: {csv_dur} != {csv_end - csv_start}"

        # Match with JSON and require EXACT match (zero tolerance)
        dispatch_id = csv_row.get("Dispatch_Id") or csv_row.get("Correlation_Id")
        if dispatch_id and str(dispatch_id) in json_map:
            matched_count += 1
            json_start, json_end, json_dur = json_map[str(dispatch_id)]

            # Check for exact match on all three values
            start_diff = csv_start - json_start
            end_diff = csv_end - json_end
            dur_diff = csv_dur - json_dur

            # Collect every discrepancy instead of failing on the first, so the
            # final report can show the full extent of any drift.
            if start_diff != 0 or end_diff != 0 or dur_diff != 0:
                mismatches.append({
                    'dispatch_id': dispatch_id,
                    'csv_start': csv_start,
                    'json_start': json_start,
                    'start_diff': start_diff,
                    'csv_end': csv_end,
                    'json_end': json_end,
                    'end_diff': end_diff,
                    'csv_dur': csv_dur,
                    'json_dur': json_dur,
                    'dur_diff': dur_diff
                })

    # Report any mismatches
    if mismatches:
        error_lines = [
            "",
            "TIMESTAMP MISMATCHES DETECTED",
            f"{'Dispatch':<10} {'Start Diff':<12} {'End Diff':<12} {'Dur Diff':<12}",
            "=" * 50
        ]

        for m in mismatches[:10]:  # Show first 10
            error_lines.append(
                f"{m['dispatch_id']:<10} {m['start_diff']:<12} {m['end_diff']:<12} {m['dur_diff']:<12}"
            )

        if len(mismatches) > 10:
            error_lines.append(f"... and {len(mismatches) - 10} more mismatches")

        # Fail the test with detailed error
        first = mismatches[0]
        error_msg = "\n".join(error_lines) + "\n\n" + (
            f"Timestamp mismatch detected for dispatch {first['dispatch_id']}:\n"
            f"  CSV:  start={first['csv_start']}, end={first['csv_end']}, duration={first['csv_dur']}\n"
            f"  JSON: start={first['json_start']}, end={first['json_end']}, duration={first['json_dur']}\n"
            f"  Diff: start={first['start_diff']}, end={first['end_diff']}, duration={first['dur_diff']}\n"
            f"Total mismatches: {len(mismatches)}/{total_count}\n"
            f"NOTE: Since JSON and rocpd come from the same execution, timestamps should be identical."
        )
        assert False, error_msg

    # Ensure we matched all records
    assert matched_count > 0, f"No CSV rows matched with JSON records"
    assert matched_count == total_count, f"Only {matched_count}/{total_count} CSV rows matched JSON"
212+
128213
if __name__ == "__main__":
    # Allow running this test module directly; forward extra CLI args to pytest.
    sys.exit(pytest.main(["-x", __file__] + sys.argv[1:]))