Correctness check for GPU Instruction Count sample (#16)

idubinov · web-flow · commit 4b7f02c130a7 · 2023-12-07T12:03:01.000+01:00
* Check correctness for gpu_inst_count tool
diff --git a/VERSION b/VERSION
@@ -1 +1 @@
-0.49.17
+0.49.18
diff --git a/tests/samples/gpu_inst_count.py b/tests/samples/gpu_inst_count.py
@@ -21,39 +21,43 @@ def build(path):
     return stderr
   return None
 
-def parse(output):
+def parseTotal(output, countString=None):
   lines = output.split("\n")
   total_count = 0
   for line in lines:
     if line.find("[INFO]") != -1:
       continue
     if line.find("[") != 0:
       continue
+    if countString != None and countString not in line:
+      continue
     items = line.split("]")
     if len(items) == 2:
       if items[0].strip() and items[1].strip():
         count = int(items[0].lstrip("[").strip())
         if count < 0:
           return False
         total_count += count
-  if total_count <= 0:
-    return False
-  return True
+  return total_count
 
-def run(path, option):
+def parse(output):
+  return False if parseTotal(output) <= 0 else True
+
+def getTestAppCommand(option, matrixSize, iterations):
   if option == "cl":
     app_folder = utils.get_sample_executable_path("cl_gemm")
     app_file = os.path.join(app_folder, "cl_gemm")
-    command = ["./gpu_inst_count", app_file, "gpu", "1024", "1"]
+    return ["./gpu_inst_count", app_file, "gpu", f"{matrixSize}", f"{iterations}"]
   elif option == "ze":
     app_folder = utils.get_sample_executable_path("ze_gemm")
     app_file = os.path.join(app_folder, "ze_gemm")
-    command = ["./gpu_inst_count", app_file, "1024", "1"]
+    return ["./gpu_inst_count", app_file, f"{matrixSize}", f"{iterations}"]
   else:
     app_folder = utils.get_sample_executable_path("dpc_gemm")
     app_file = os.path.join(app_folder, "dpc_gemm")
-    command = ["./gpu_inst_count", app_file, "gpu", "1024", "1"]
-  stdout, stderr = utils.run_process(command, path)
+    return ["./gpu_inst_count", app_file, "gpu",  f"{matrixSize}", f"{iterations}"]
+
+def isValidOutput(stdout, stderr):
   if not stdout:
     return "stdout is empty"
   if not stderr:
@@ -66,6 +70,42 @@ def run(path, option):
     return stderr
   return None
 
+def run(path, option):
+  # Smoke test
+  command = getTestAppCommand(option, 1024, 1)
+  stdout, stderr = utils.run_process(command, path)
+  res = isValidOutput(stdout, stderr)
+  if res != None: return res
+
+  # Correctness test
+  # Test is based on relative results of instruction count. Test application
+  # has N^3 complexity. Correctness based on number of executed multiply ('mad') instructions
+  # for matrix sizes baseSize * {1, 2, 4} is checked as: (-12*r1-r2+r4)/44 == (4*r1-r2)/-4
+
+  baseSize = 128
+  command = getTestAppCommand(option, baseSize * 1, 1)
+  stdout, stderr = utils.run_process(command, path)
+  res = isValidOutput(stdout, stderr)
+  if res != None: return res
+  r1 = parseTotal(stderr, 'mad')
+
+  command = getTestAppCommand(option, baseSize * 2, 1)
+  stdout, stderr = utils.run_process(command, path)
+  res = isValidOutput(stdout, stderr)
+  if res != None: return res
+  r2 = parseTotal(stderr, 'mad')
+
+  command = getTestAppCommand(option, baseSize * 4, 1)
+  stdout, stderr = utils.run_process(command, path)
+  res = isValidOutput(stdout, stderr)
+  if res != None: return res
+  r4 = parseTotal(stderr, 'mad')
+
+  if (-12*r1 -r2 +r4)/44 != (4*r1 - r2)/-4:
+    return f"Correctness check failed: {r1 * 8} != {r2}"
+
+  return None
+
 def main(option):
   path = utils.get_sample_build_path("gpu_inst_count")
   if option == "cl":