add xpu_arch_to_mem_type_multiplier

dev-tomek · web-flow · commit 4b349f054bc8 · 2025-12-07T21:09:37.000+01:00
diff --git a/third_party/proton/proton/specs.py b/third_party/proton/proton/specs.py
@@ -18,6 +18,12 @@
     'gfx950': 8.0 * 1e12,
 }
 
+xpu_arch_to_mem_type_multiplier = {
+    "pvc": 2,
+    "dg2": 8,
+    "bmg": 8,
+}
+
 # FP8 Matrix Performance(FLOPS/clock/CU)
 # For gfx90a we use the performance of INT8 since it doesn't support FP8 matrix operations.
 amd_fp8_flops_by_arch = {'gfx90a': 1024, 'gfx942': 4096, 'gfx950': 8192}
@@ -67,11 +73,5 @@ def max_bps(device_type, arch, bus_width, memory_clock_rate):
     elif device_type == "HIP":
         return amd_bps_by_arch[arch]
     else:
-        assert device_type == "XPU"
-        if arch == "Xe-HPC":
-            multiplier = 2
-        elif arch == "Xe2" or arch == "Xe-HPG":
-            multiplier = 8
-        else:
-            raise ValueError(f"Unsupported architecture: {arch}")
-        return multiplier * bus_width * memory_clock_rate * 1e3 / 8
+        assert device_type == "XPU" 
+        return xpu_arch_to_mem_type_multiplier[arch] * bus_width * memory_clock_rate * 1e3 / 8