Skip to content

Commit 3f5b505

Browse files
Hardcode84 authored and Diptorup Deb committed
Rambo f64 emulation
1 parent 958f98b commit 3f5b505

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

dpbench/benchmarks/rambo/rambo_numba_mlir_k.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
 import numba_mlir.kernel as nb
 
 
-@nb.kernel
+@nb.kernel(gpu_fp64_truncate="auto")
 def _rambo(C1, F1, Q1, nout, output):
     i = nb.get_global_id(0)
     for j in range(nout):

dpbench/benchmarks/rambo/rambo_numba_mlir_n.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
 import numpy as np
 
 
-@nb.njit
+@nb.njit(parallel=True, fastmath=True, gpu_fp64_truncate="auto")
 def rambo(nevts, nout, C1, F1, Q1, output):
     C = 2.0 * C1 - 1.0
     S = np.sqrt(1 - np.square(C))

dpbench/benchmarks/rambo/rambo_numba_mlir_p.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
 import numpy as np
 
 
-@nb.njit
+@nb.njit(parallel=True, fastmath=True, gpu_fp64_truncate="auto")
 def rambo(nevts, nout, C1, F1, Q1, output):
     for i in numba.prange(nevts):
         for j in numba.prange(nout):

0 commit comments

Comments
 (0)