From c6519ef8bfaeb9835006902cf6ca755d0a4a1358 Mon Sep 17 00:00:00 2001 From: Wenju He Date: Mon, 12 Aug 2024 04:33:13 -0700 Subject: [PATCH] Translate floating-point atomic_compare_exchange as integer (#2668) OpenCL spec supports atomic_float/atomic_double type for atomic_compare_exchange* functions. However, value and return type in OpAtomicCompareExchange in SPIR-V spec must be integer type. Therefore, in OCLToSPIRV translation we need to translate floating-point type to corresponding integer variant that has the same type size. Floating-point value is bitcasted so that bits remain the same. Original commit: https://github.com/KhronosGroup/SPIRV-LLVM-Translator/commit/e5544014fba77d3 --- llvm-spirv/lib/SPIRV/OCLToSPIRV.cpp | 12 ++ .../AtomicCompareExchangeExplicit_cl20.cl | 146 +++++++++++++----- .../transcoding/AtomicCompareExchange_cl20.ll | 68 ++++++++ 3 files changed, 186 insertions(+), 40 deletions(-) diff --git a/llvm-spirv/lib/SPIRV/OCLToSPIRV.cpp b/llvm-spirv/lib/SPIRV/OCLToSPIRV.cpp index 80c93f5a6bf54..be04f0ad91f6d 100644 --- a/llvm-spirv/lib/SPIRV/OCLToSPIRV.cpp +++ b/llvm-spirv/lib/SPIRV/OCLToSPIRV.cpp @@ -485,6 +485,18 @@ CallInst *OCLToSPIRVBase::visitCallAtomicCmpXchg(CallInst *CI) { auto Mutator = mutateCallInst(CI, kOCLBuiltinName::AtomicCmpXchgStrong); Value *Expected = Mutator.getArg(1); Type *MemTy = Mutator.getArg(2)->getType(); + if (MemTy->isFloatTy() || MemTy->isDoubleTy()) { + MemTy = + MemTy->isFloatTy() ? Type::getInt32Ty(*Ctx) : Type::getInt64Ty(*Ctx); + Mutator.replaceArg( + 0, + {Mutator.getArg(0), + TypedPointerType::get( + MemTy, Mutator.getArg(0)->getType()->getPointerAddressSpace())}); + Mutator.mapArg(2, [=](IRBuilder<> &Builder, Value *V) { + return Builder.CreateBitCast(V, MemTy); + }); + } assert(MemTy->isIntegerTy() && "In SPIR-V 1.0 arguments of OpAtomicCompareExchange must be " "an integer type scalars"); diff --git a/llvm-spirv/test/transcoding/AtomicCompareExchangeExplicit_cl20.cl b/llvm-spirv/test/transcoding/AtomicCompareExchangeExplicit_cl20.cl index 166cda9284fc4..7eefe0dafd3e0 100644 --- a/llvm-spirv/test/transcoding/AtomicCompareExchangeExplicit_cl20.cl +++ b/llvm-spirv/test/transcoding/AtomicCompareExchangeExplicit_cl20.cl @@ -6,46 +6,112 @@ // RUN: llvm-spirv -r --spirv-target-env=CL2.0 %t.spv -o %t.rev.bc // RUN: llvm-dis < %t.rev.bc | FileCheck %s --check-prefix=CHECK-LLVM -__kernel void testAtomicCompareExchangeExplicit_cl20( - volatile global atomic_int* object, - global int* expected, - int desired) -{ - // Values of memory order and memory scope arguments correspond to SPIR-2.0 spec. - atomic_compare_exchange_strong_explicit(object, expected, desired, - memory_order_release, // 3 - memory_order_relaxed // 0 - ); // by default, assume device scope = 2 - atomic_compare_exchange_strong_explicit(object, expected, desired, - memory_order_acq_rel, // 4 - memory_order_relaxed, // 0 - memory_scope_work_group // 1 - ); - atomic_compare_exchange_weak_explicit(object, expected, desired, - memory_order_release, // 3 - memory_order_relaxed // 0 - ); // by default, assume device scope = 2 - atomic_compare_exchange_weak_explicit(object, expected, desired, - memory_order_acq_rel, // 4 - memory_order_relaxed, // 0 - memory_scope_work_group // 1 - ); +#define DEFINE_KERNEL(TYPE) \ +__kernel void testAtomicCompareExchangeExplicit_cl20_##TYPE( \ + volatile global atomic_##TYPE* object, \ + global TYPE* expected, \ + TYPE desired) \ +{ \ + /* Values of memory order and memory scope arguments correspond to SPIR-2.0 spec. */ \ + atomic_compare_exchange_strong_explicit(object, expected, desired, \ + memory_order_release, /* 3 */ \ + memory_order_relaxed /* 0 */ \ + ); /* by default, assume device scope = 2 */ \ + atomic_compare_exchange_strong_explicit(object, expected, desired, \ + memory_order_acq_rel, /* 4 */ \ + memory_order_relaxed, /* 0 */ \ + memory_scope_work_group /* 1 */ \ + ); \ + atomic_compare_exchange_weak_explicit(object, expected, desired, \ + memory_order_release, /* 3 */ \ + memory_order_relaxed /* 0 */ \ + ); /* by default, assume device scope = 2 */ \ + atomic_compare_exchange_weak_explicit(object, expected, desired, \ + memory_order_acq_rel, /* 4 */ \ + memory_order_relaxed, /* 0 */ \ + memory_scope_work_group /* 1 */ \ + ); \ } -//CHECK-SPIRV: TypeInt [[int:[0-9]+]] 32 0 +DEFINE_KERNEL(int) +DEFINE_KERNEL(float) +DEFINE_KERNEL(double) + +//CHECK-SPIRV: TypeInt [[int32:[0-9]+]] 32 0 +//CHECK-SPIRV: TypeInt [[int64:[0-9]+]] 64 0 //; Constants below correspond to the SPIR-V spec -//CHECK-SPIRV-DAG: Constant [[int]] [[DeviceScope:[0-9]+]] 1 -//CHECK-SPIRV-DAG: Constant [[int]] [[WorkgroupScope:[0-9]+]] 2 -//CHECK-SPIRV-DAG: Constant [[int]] [[ReleaseMemSem:[0-9]+]] 4 -//CHECK-SPIRV-DAG: Constant [[int]] [[RelaxedMemSem:[0-9]+]] 0 -//CHECK-SPIRV-DAG: Constant [[int]] [[AcqRelMemSem:[0-9]+]] 8 - -//CHECK-SPIRV: AtomicCompareExchange {{[0-9]+}} {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] -//CHECK-SPIRV: AtomicCompareExchange {{[0-9]+}} {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] -//CHECK-SPIRV: AtomicCompareExchange {{[0-9]+}} {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] -//CHECK-SPIRV: AtomicCompareExchange {{[0-9]+}} {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] - -//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected5.as, i32 %desired, i32 3, i32 0, i32 2) -//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected8.as, i32 %desired, i32 4, i32 0, i32 1) -//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected11.as, i32 %desired, i32 3, i32 0, i32 2) -//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected14.as, i32 %desired, i32 4, i32 0, i32 1) +//CHECK-SPIRV-DAG: Constant [[int32]] [[DeviceScope:[0-9]+]] 1 +//CHECK-SPIRV-DAG: Constant [[int32]] [[WorkgroupScope:[0-9]+]] 2 +//CHECK-SPIRV-DAG: Constant [[int32]] [[ReleaseMemSem:[0-9]+]] 4 +//CHECK-SPIRV-DAG: Constant [[int32]] [[RelaxedMemSem:[0-9]+]] 0 +//CHECK-SPIRV-DAG: Constant [[int32]] [[AcqRelMemSem:[0-9]+]] 8 + +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] + +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int32]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] + +//CHECK-SPIRV: AtomicCompareExchange [[int64]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int64]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int64]] {{[0-9]+}} {{[0-9]+}} [[DeviceScope]] [[ReleaseMemSem]] [[RelaxedMemSem]] +//CHECK-SPIRV: AtomicCompareExchange [[int64]] {{[0-9]+}} {{[0-9]+}} [[WorkgroupScope]] [[AcqRelMemSem]] [[RelaxedMemSem]] + +//CHECK-LLVM-LABEL: define spir_kernel void @testAtomicCompareExchangeExplicit_cl20_int( +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected{{.*}}, i32 %desired, i32 3, i32 0, i32 2) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected{{.*}}, i32 %desired, i32 4, i32 0, i32 1) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected{{.*}}, i32 %desired, i32 3, i32 0, i32 2) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) %0, ptr addrspace(4) %expected{{.*}}, i32 %desired, i32 4, i32 0, i32 1) + +//CHECK-LLVM-LABEL: define spir_kernel void @testAtomicCompareExchangeExplicit_cl20_float( +//CHECK-LLVM: [[OBJECT:%[0-9]+]] = addrspacecast ptr addrspace(1) %object to ptr addrspace(4) +//CHECK-LLVM: [[EXPECTED:%[0-9]+]] = addrspacecast ptr addrspace(1) %expected to ptr addrspace(4) +//CHECK-LLVM: [[CAST1:%[0-9]+]] = bitcast float %desired to i32 +//CHECK-LLVM: %exp = load i32, ptr addrspace(4) [[EXPECTED]], align 4 +//CHECK-LLVM: store i32 %exp, ptr [[EXPECTED_ALLOCA:%expected[0-9]+]], align 4 +//CHECK-LLVM: [[EXPECTED_AS1:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS1]], i32 [[CAST1]], i32 3, i32 0, i32 2) +//CHECK-LLVM: [[CAST2:%[0-9]+]] = bitcast float %desired to i32 +//CHECK-LLVM: [[LOAD2:%exp[0-9]+]] = load i32, ptr addrspace(4) [[EXPECTED]], align 4 +//CHECK-LLVM: store i32 [[LOAD2]], ptr [[EXPECTED_ALLOCA2:%expected[0-9]+]], align 4 +//CHECK-LLVM: [[EXPECTED_AS2:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA2]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS2]], i32 [[CAST2]], i32 4, i32 0, i32 1) +//CHECK-LLVM: [[CAST3:%[0-9]+]] = bitcast float %desired to i32 +//CHECK-LLVM: [[LOAD3:%exp[0-9]+]] = load i32, ptr addrspace(4) [[EXPECTED]], align 4 +//CHECK-LLVM: store i32 [[LOAD3]], ptr [[EXPECTED_ALLOCA3:%expected[0-9]+]], align 4 +//CHECK-LLVM: [[EXPECTED_AS3:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA3]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS3]], i32 [[CAST3]], i32 3, i32 0, i32 2) +//CHECK-LLVM: [[CAST4:%[0-9]+]] = bitcast float %desired to i32 +//CHECK-LLVM: [[LOAD4:%exp[0-9]+]] = load i32, ptr addrspace(4) [[EXPECTED]], align 4 +//CHECK-LLVM: store i32 [[LOAD4]], ptr [[EXPECTED_ALLOCA4:%expected[0-9]+]], align 4 +//CHECK-LLVM: [[EXPECTED_AS4:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA4]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS4]], i32 [[CAST4]], i32 4, i32 0, i32 1) + + +//CHECK-LLVM-LABEL: define spir_kernel void @testAtomicCompareExchangeExplicit_cl20_double( +//CHECK-LLVM: [[OBJECT:%[0-9]+]] = addrspacecast ptr addrspace(1) %object to ptr addrspace(4) +//CHECK-LLVM: [[EXPECTED:%[0-9]+]] = addrspacecast ptr addrspace(1) %expected to ptr addrspace(4) +//CHECK-LLVM: [[CAST1:%[0-9]+]] = bitcast double %desired to i64 +//CHECK-LLVM: %exp = load i64, ptr addrspace(4) [[EXPECTED]], align 8 +//CHECK-LLVM: store i64 %exp, ptr [[EXPECTED_ALLOCA:%expected[0-9]+]], align 8 +//CHECK-LLVM: [[EXPECTED_AS1:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiclPU3AS4ll12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS1]], i64 [[CAST1]], i32 3, i32 0, i32 2) +//CHECK-LLVM: [[CAST2:%[0-9]+]] = bitcast double %desired to i64 +//CHECK-LLVM: [[LOAD2:%exp[0-9]+]] = load i64, ptr addrspace(4) [[EXPECTED]], align 8 +//CHECK-LLVM: store i64 [[LOAD2]], ptr [[EXPECTED_ALLOCA2:%expected[0-9]+]], align 8 +//CHECK-LLVM: [[EXPECTED_AS2:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA2]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiclPU3AS4ll12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS2]], i64 [[CAST2]], i32 4, i32 0, i32 1) +//CHECK-LLVM: [[CAST3:%[0-9]+]] = bitcast double %desired to i64 +//CHECK-LLVM: [[LOAD3:%exp[0-9]+]] = load i64, ptr addrspace(4) [[EXPECTED]], align 8 +//CHECK-LLVM: store i64 [[LOAD3]], ptr [[EXPECTED_ALLOCA3:%expected[0-9]+]], align 8 +//CHECK-LLVM: [[EXPECTED_AS3:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA3]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiclPU3AS4ll12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS3]], i64 [[CAST3]], i32 3, i32 0, i32 2) +//CHECK-LLVM: [[CAST4:%[0-9]+]] = bitcast double %desired to i64 +//CHECK-LLVM: [[LOAD4:%exp[0-9]+]] = load i64, ptr addrspace(4) [[EXPECTED]], align 8 +//CHECK-LLVM: store i64 [[LOAD4]], ptr [[EXPECTED_ALLOCA4:%expected[0-9]+]], align 8 +//CHECK-LLVM: [[EXPECTED_AS4:%expected.*]] = addrspacecast ptr [[EXPECTED_ALLOCA4]] to ptr addrspace(4) +//CHECK-LLVM: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiclPU3AS4ll12memory_orderS4_12memory_scope(ptr addrspace(4) [[OBJECT]], ptr addrspace(4) [[EXPECTED_AS4]], i64 [[CAST4]], i32 4, i32 0, i32 1) diff --git a/llvm-spirv/test/transcoding/AtomicCompareExchange_cl20.ll b/llvm-spirv/test/transcoding/AtomicCompareExchange_cl20.ll index 98b59a7364c3b..97c598aa9e292 100644 --- a/llvm-spirv/test/transcoding/AtomicCompareExchange_cl20.ll +++ b/llvm-spirv/test/transcoding/AtomicCompareExchange_cl20.ll @@ -26,6 +26,24 @@ target triple = "spir-unknown-unknown" ; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicit{{.*}}(ptr {{.*}} %object, ptr {{.*}} [[PTR_STRONG]].as, i32 %desired, i32 5, i32 5, i32 2) ; CHECK: load i32, ptr addrspace(4) [[PTR_STRONG]].as +; CHECK-LABEL: define spir_func void @test_strong_float +; CHECK-NEXT: entry: +; CHECK: [[PTR_STRONG:%expected[0-9]*]] = alloca i32, align 4 +; CHECK: [[DESIRED_CAST:%[0-9]*]] = bitcast float %desired to i32 +; CHECK: store i32 {{.*}}, ptr [[PTR_STRONG]] +; CHECK: [[PTR_STRONG]].as = addrspacecast ptr [[PTR_STRONG]] to ptr addrspace(4) +; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicit{{.*}}(ptr {{.*}} %object, ptr {{.*}} [[PTR_STRONG]].as, i32 [[DESIRED_CAST]], i32 5, i32 5, i32 2) +; CHECK: load i32, ptr addrspace(4) [[PTR_STRONG]].as + +; CHECK-LABEL: define spir_func void @test_strong_double +; CHECK-NEXT: entry: +; CHECK: [[PTR_STRONG:%expected[0-9]*]] = alloca i64, align 8 +; CHECK: [[DESIRED_CAST:%[0-9]*]] = bitcast double %desired to i64 +; CHECK: store i64 {{.*}}, ptr [[PTR_STRONG]] +; CHECK: [[PTR_STRONG]].as = addrspacecast ptr [[PTR_STRONG]] to ptr addrspace(4) +; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicit{{.*}}(ptr {{.*}} %object, ptr {{.*}} [[PTR_STRONG]].as, i64 [[DESIRED_CAST]], i32 5, i32 5, i32 2) +; CHECK: load i64, ptr addrspace(4) [[PTR_STRONG]].as + ; CHECK-LABEL: define spir_func void @test_weak ; CHECK-NEXT: entry: ; CHECK: [[PTR_WEAK:%expected[0-9]*]] = alloca i32, align 4 @@ -34,6 +52,24 @@ target triple = "spir-unknown-unknown" ; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope{{.*}}(ptr {{.*}} %object, ptr {{.*}} [[PTR_WEAK]].as, i32 %desired, i32 5, i32 5, i32 2) ; CHECK: load i32, ptr addrspace(4) [[PTR_WEAK]].as +; CHECK-LABEL: define spir_func void @test_weak_float +; CHECK-NEXT: entry: +; CHECK: [[PTR_WEAK:%expected[0-9]*]] = alloca i32, align 4 +; CHECK: [[DESIRED_CAST:%[0-9]*]] = bitcast float %desired to i32 +; CHECK: store i32 {{.*}}, ptr [[PTR_WEAK]] +; CHECK: [[PTR_WEAK]].as = addrspacecast ptr [[PTR_WEAK]] to ptr addrspace(4) +; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiciPU3AS4ii12memory_orderS4_12memory_scope(ptr {{.*}} %object, ptr {{.*}} [[PTR_WEAK]].as, i32 [[DESIRED_CAST]], i32 5, i32 5, i32 2) +; CHECK: load i32, ptr addrspace(4) [[PTR_WEAK]].as + +; CHECK-LABEL: define spir_func void @test_weak_double +; CHECK-NEXT: entry: +; CHECK: [[PTR_WEAK:%expected[0-9]*]] = alloca i64, align 8 +; CHECK: [[DESIRED_CAST:%[0-9]*]] = bitcast double %desired to i64 +; CHECK: store i64 {{.*}}, ptr [[PTR_WEAK]] +; CHECK: [[PTR_WEAK]].as = addrspacecast ptr [[PTR_WEAK]] to ptr addrspace(4) +; CHECK: call spir_func i1 @_Z39atomic_compare_exchange_strong_explicitPU3AS4VU7_AtomiclPU3AS4ll12memory_orderS4_12memory_scope(ptr {{.*}} %object, ptr {{.*}} [[PTR_WEAK]].as, i64 [[DESIRED_CAST]], i32 5, i32 5, i32 2) +; CHECK: load i64, ptr addrspace(4) [[PTR_WEAK]].as + ; Check that alloca for atomic_compare_exchange is being created in the entry block. ; CHECK-LABEL: @atomic_in_loop @@ -52,6 +88,22 @@ entry: declare spir_func zeroext i1 @_Z30atomic_compare_exchange_strongPVU3AS4U7_AtomiciPU3AS4ii(ptr addrspace(4), ptr addrspace(4), i32) #1 +define spir_func void @test_strong_float(ptr addrspace(4) %object, ptr addrspace(4) %expected, float %desired) #0 { +entry: + %call = call spir_func zeroext i1 @_Z30atomic_compare_exchange_strongPU3AS1VU7_AtomicfPU3AS1ff(ptr addrspace(4) %object, ptr addrspace(4) %expected, float %desired) #2 + ret void +} + +declare spir_func zeroext i1 @_Z30atomic_compare_exchange_strongPU3AS1VU7_AtomicfPU3AS1ff(ptr addrspace(4), ptr addrspace(4), float) + +define spir_func void @test_strong_double(ptr addrspace(4) %object, ptr addrspace(4) %expected, double %desired) #0 { +entry: + %call = call spir_func zeroext i1 @_Z30atomic_compare_exchange_strongPU3AS1VU7_AtomicdPU3AS1dd(ptr addrspace(4) %object, ptr addrspace(4) %expected, double %desired) #2 + ret void +} + +declare spir_func zeroext i1 @_Z30atomic_compare_exchange_strongPU3AS1VU7_AtomicdPU3AS1dd(ptr addrspace(4), ptr addrspace(4), double) + ; Function Attrs: nounwind define spir_func void @test_weak(ptr addrspace(4) %object, ptr addrspace(4) %expected, i32 %desired) #0 { entry: @@ -61,6 +113,22 @@ entry: declare spir_func zeroext i1 @_Z28atomic_compare_exchange_weakPVU3AS4U7_AtomiciPU3AS4ii(ptr addrspace(4), ptr addrspace(4), i32) #1 +define spir_func void @test_weak_float(ptr addrspace(4) %object, ptr addrspace(4) %expected, float %desired) #0 { +entry: + %call = call spir_func zeroext i1 @_Z28atomic_compare_exchange_weakPU3AS1VU7_AtomicfPU3AS1ff(ptr addrspace(4) %object, ptr addrspace(4) %expected, float %desired) #2 + ret void +} + +declare spir_func zeroext i1 @_Z28atomic_compare_exchange_weakPU3AS1VU7_AtomicfPU3AS1ff(ptr addrspace(4), ptr addrspace(4), float) + +define spir_func void @test_weak_double(ptr addrspace(4) %object, ptr addrspace(4) %expected, double %desired) #0 { +entry: + %call = call spir_func zeroext i1 @_Z28atomic_compare_exchange_weakPU3AS1VU7_AtomicdPU3AS1dd(ptr addrspace(4) %object, ptr addrspace(4) %expected, double %desired) #2 + ret void +} + +declare spir_func zeroext i1 @_Z28atomic_compare_exchange_weakPU3AS1VU7_AtomicdPU3AS1dd(ptr addrspace(4), ptr addrspace(4), double) + ; Function Attrs: nounwind define spir_kernel void @atomic_in_loop(ptr addrspace(1) %destMemory, ptr addrspace(1) %oldValues) #0 { entry: