@@ -934,8 +934,9 @@ def load_all():
934
934
if cubin_name in RUNTIME_CACHE :
935
935
continue
936
936
symbol , sha256 = KERNEL_MAP [cubin_name ]
937
- get_cubin (ArtifactPath .DEEPGEMM + cubin_name , sha256 )
938
- path = FLASHINFER_CUBIN_DIR / f"{ ArtifactPath .DEEPGEMM + cubin_name } .cubin"
937
+ cubin_name = cubin_name + ".cubin"
938
+ get_cubin (ArtifactPath .DEEPGEMM + "/" + cubin_name , sha256 )
939
+ path = FLASHINFER_CUBIN_DIR / ArtifactPath .DEEPGEMM / cubin_name
939
940
assert path .exists ()
940
941
RUNTIME_CACHE [cubin_name ] = SM100FP8GemmRuntime (str (path ), symbol )
941
942
@@ -948,8 +949,9 @@ def load(name: str, code: str) -> SM100FP8GemmRuntime:
948
949
if cubin_name in RUNTIME_CACHE :
949
950
return RUNTIME_CACHE [cubin_name ]
950
951
symbol , sha256 = KERNEL_MAP [cubin_name ]
951
- get_cubin (ArtifactPath .DEEPGEMM + cubin_name , sha256 )
952
- path = FLASHINFER_CUBIN_DIR / f"{ ArtifactPath .DEEPGEMM + cubin_name } .cubin"
952
+ cubin_name = cubin_name + ".cubin"
953
+ get_cubin (ArtifactPath .DEEPGEMM + "/" + cubin_name , sha256 )
954
+ path = FLASHINFER_CUBIN_DIR / ArtifactPath .DEEPGEMM / cubin_name
953
955
assert path .exists ()
954
956
RUNTIME_CACHE [cubin_name ] = SM100FP8GemmRuntime (str (path ), symbol )
955
957
return RUNTIME_CACHE [cubin_name ]
@@ -1490,11 +1492,11 @@ def __init__(self, sha256: str):
1490
1492
self .indice = None
1491
1493
1492
1494
def init_indices(self):
    """Load the DeepGEMM kernel map JSON into ``self.indice``.

    The kernel map lives at ``<ArtifactPath.DEEPGEMM>/kernel_map.json``
    relative to ``FLASHINFER_CUBIN_DIR``. ``get_cubin`` is called with that
    relative path and ``self.sha256`` and must return a truthy value
    (presumably it fetches and/or checksum-verifies the file; confirm
    against its definition).

    Raises:
        AssertionError: if ``get_cubin`` reports failure, or if the file is
            still missing from ``FLASHINFER_CUBIN_DIR`` afterwards.
    """
    indice_path = ArtifactPath.DEEPGEMM + "/" + "kernel_map.json"

    # Call get_cubin outside of an ``assert`` statement: asserts are removed
    # under ``python -O``, which would silently skip the call altogether.
    if not get_cubin(indice_path, self.sha256):
        raise AssertionError(
            "cubin kernel map file not found, nor downloaded with matched sha256"
        )

    path = FLASHINFER_CUBIN_DIR / indice_path
    # AssertionError is kept so existing callers see the same exception type.
    if not path.exists():
        raise AssertionError(f"cubin kernel map file missing: {path}")

    # JSON text is UTF-8; do not depend on the platform's default encoding.
    with open(path, "r", encoding="utf-8") as f:
        self.indice = json.load(f)
0 commit comments