[flang-commits] [flang] 5c40133 - [flang][cuda] Add bind name for __dsqrt_rd and __dsqrt_ru interfaces (#153290)
via flang-commits
flang-commits at lists.llvm.org
Wed Aug 13 11:38:35 PDT 2025
Author: Valentin Clement (バレンタイン クレメン)
Date: 2025-08-13T18:38:31Z
New Revision: 5c401331d73f18bbd83929db20724282b322d1f4
URL: https://github.com/llvm/llvm-project/commit/5c401331d73f18bbd83929db20724282b322d1f4
DIFF: https://github.com/llvm/llvm-project/commit/5c401331d73f18bbd83929db20724282b322d1f4.diff
LOG: [flang][cuda] Add bind name for __dsqrt_rd and __dsqrt_ru interfaces (#153290)
Added:
Modified:
flang/module/cudadevice.f90
flang/test/Lower/CUDA/cuda-device-proc.cuf
Removed:
################################################################################
diff --git a/flang/module/cudadevice.f90 b/flang/module/cudadevice.f90
index c026bc5b284b8..1bccff1b5a892 100644
--- a/flang/module/cudadevice.f90
+++ b/flang/module/cudadevice.f90
@@ -695,15 +695,15 @@ attributes(device) real(8) function sinpi(x) bind(c,name='__nv_sinpi')
end function
end interface
- interface __dsqrt_ru
- attributes(device) double precision function __dsqrt_ru(x) bind(c)
+ interface __dsqrt_rd
+ attributes(device) double precision function __dsqrt_rd(x) bind(c, name='__nv_dsqrt_rd')
!dir$ ignore_tkr (d) x
double precision, value :: x
end function
end interface
- interface __dsqrt_rd
- attributes(device) double precision function __dsqrt_rd(x) bind(c)
+ interface __dsqrt_ru
+ attributes(device) double precision function __dsqrt_ru(x) bind(c, name='__nv_dsqrt_ru')
!dir$ ignore_tkr (d) x
double precision, value :: x
end function
diff --git a/flang/test/Lower/CUDA/cuda-device-proc.cuf b/flang/test/Lower/CUDA/cuda-device-proc.cuf
index a01935876360a..676e455b06e2f 100644
--- a/flang/test/Lower/CUDA/cuda-device-proc.cuf
+++ b/flang/test/Lower/CUDA/cuda-device-proc.cuf
@@ -77,6 +77,8 @@ attributes(global) subroutine devsub()
ai = __mul24(ai, ai)
ai = __umul24(ai, ai)
af = __powf(af, af)
+ ad = __dsqrt_rd(ad)
+ ad = __dsqrt_ru(ad)
end
! CHECK-LABEL: func.func @_QPdevsub() attributes {cuf.proc_attr = #cuf.cuda_proc<global>}
@@ -141,6 +143,8 @@ end
! CHECK: %{{.*}} = fir.call @__nv_mul24(%{{.*}}, %{{.*}}) proc_attrs<bind_c> fastmath<contract> : (i32, i32) -> i32
! CHECK: %{{.*}} = fir.call @__nv_umul24(%{{.*}}, %{{.*}}) proc_attrs<bind_c> fastmath<contract> : (i32, i32) -> i32
! CHECK: %{{.*}} = fir.call @__nv_powf(%{{.*}}, %{{.*}}) proc_attrs<bind_c> fastmath<contract> : (f32, f32) -> f32
+! CHECK: %{{.*}} = fir.call @__nv_dsqrt_rd(%{{.*}}) proc_attrs<bind_c> fastmath<contract> : (f64) -> f64
+! CHECK: %{{.*}} = fir.call @__nv_dsqrt_ru(%{{.*}}) proc_attrs<bind_c> fastmath<contract> : (f64) -> f64
subroutine host1()
integer, device :: a(32)
More information about the flang-commits mailing list