From ad1941a1127478c61ee3483b37ef0ead5b47d350 Mon Sep 17 00:00:00 2001 From: Valentin Clement Date: Fri, 8 Aug 2025 14:35:00 -0700 Subject: [PATCH] [flang][cuda] Add bind name for __ffs interface --- flang/module/cudadevice.f90 | 4 ++-- flang/test/Lower/CUDA/cuda-device-proc.cuf | 7 +++++++ 2 files changed, 9 insertions(+), 2 deletions(-) diff --git a/flang/module/cudadevice.f90 b/flang/module/cudadevice.f90 index d0c312c09353f..80ae0abf76687 100644 --- a/flang/module/cudadevice.f90 +++ b/flang/module/cudadevice.f90 @@ -743,11 +743,11 @@ attributes(device) real(8) function sinpi(x) bind(c,name='__nv_sinpi') end interface interface __ffs - attributes(device) integer function __ffs(i) bind(c) + attributes(device) integer function __ffs(i) bind(c, name='__nv_ffs') !dir$ ignore_tkr (d) i integer, value :: i end function - attributes(device) integer function __ffsll(i) bind(c) + attributes(device) integer function __ffsll(i) bind(c, name='__nv_ffsll') !dir$ ignore_tkr (d) i integer(8), value :: i end function diff --git a/flang/test/Lower/CUDA/cuda-device-proc.cuf b/flang/test/Lower/CUDA/cuda-device-proc.cuf index d5e614a83b354..db034f40a2506 100644 --- a/flang/test/Lower/CUDA/cuda-device-proc.cuf +++ b/flang/test/Lower/CUDA/cuda-device-proc.cuf @@ -11,6 +11,7 @@ attributes(global) subroutine devsub() integer(8) :: al integer(8) :: time integer :: smalltime + integer(4) :: res call syncthreads() call syncwarp(1) @@ -49,6 +50,9 @@ attributes(global) subroutine devsub() smalltime = clock() time = clock64() time = globalTimer() + + res = __ffs(ai) + res = __ffs(al) end ! CHECK-LABEL: func.func @_QPdevsub() attributes {cuf.proc_attr = #cuf.cuda_proc} @@ -89,6 +93,9 @@ end ! CHECK: %{{.*}} = nvvm.read.ptx.sreg.clock64 : i64 ! CHECK: %{{.*}} = nvvm.read.ptx.sreg.globaltimer : i64 +! CHECK: %{{.*}} = fir.call @__nv_ffs(%{{.*}}) proc_attrs fastmath : (i32) -> i32 +! 
CHECK: %{{.*}} = fir.call @__nv_ffsll(%{{.*}}) proc_attrs fastmath : (i64) -> i32 + subroutine host1() integer, device :: a(32) integer, device :: ret