
This is intended to solve a problem with lowering atomics in OpenMP and C++ that is common to AMDGPU and NVPTX. In OpenCL and CUDA, it is undefined behavior for an atomic instruction to modify an object in thread-private memory. In OpenMP, it is defined. Correspondingly, the hardware does not handle this case correctly: on AMDGPU, 32-bit atomics work, while 64-bit atomics are silently dropped. We therefore need to codegen this by inserting a runtime address space check, performing the private case without atomics, and falling back to issuing the real atomic otherwise. The metadata introduced here allows us to avoid this extra check and branch: it is intended to be applied to atomicrmw instructions and indicates that they cannot access the forbidden address space.
61 lines
1.8 KiB
LLVM
61 lines
1.8 KiB
LLVM
; RUN: not llvm-as < %s -o /dev/null 2>&1 | FileCheck %s
;
; Negative verifier test for !noalias.addrspace metadata on atomicrmw: each
; function in this file attaches a malformed metadata node, so the assembler
; is expected to fail (hence "not llvm-as") and print the listed diagnostics.
|
|
|
|
; Empty node: !0 has no operands at all, so it describes no range.
; CHECK: It should have at least one range!
; CHECK-NEXT: !0 = !{}
define i64 @noalias_addrspace__empty(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !0
  ret i64 %ret
}
|
|
|
|
; Odd operand count: !1 supplies a single i32, so the range it starts is never
; completed by a second value.
; CHECK: Unfinished range!
; CHECK-NEXT: !1 = !{i32 0}
define i64 @noalias_addrspace__single_field(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !1
  ret i64 %ret
}
|
|
|
|
; Degenerate range: both operands of !2 are i32 0, which the verifier is
; expected to reject as an empty range.
; CHECK: Range must not be empty!
; CHECK-NEXT: !2 = !{i32 0, i32 0}
define i64 @noalias_addrspace__0_0(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !2
  ret i64 %ret
}
|
|
|
|
; Wrong integer width: !3 uses i64 operands where i32 is required.
; The expected diagnostic echoes the offending instruction, so the result name
; %ret must stay in sync with the pattern below. The echoed form carries an
; explicit "align 8" that the source line omits (presumably the default
; alignment filled in when the instruction is printed).
; CHECK: noalias.addrspace type must be i32!
; CHECK-NEXT: %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, align 8, !noalias.addrspace !3
define i64 @noalias_addrspace__i64(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !3
  ret i64 %ret
}
|
|
|
|
; Non-integer operands: !4 holds float constants instead of integers.
; CHECK: The lower limit must be an integer!
define i64 @noalias_addrspace__fp(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !4
  ret i64 %ret
}
|
|
|
|
; Non-integer operands: !5 holds null pointer constants instead of integers.
; CHECK: The lower limit must be an integer!
define i64 @noalias_addrspace__ptr(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !5
  ret i64 %ret
}
|
|
|
|
; Operands that are i32-typed but not integer literals: !6 is built from
; ptrtoint constant expressions over the globals @gv0 and @gv1.
; CHECK: The lower limit must be an integer!
define i64 @noalias_addrspace__nonconstant(ptr %ptr, i64 %val) {
  %ret = atomicrmw add ptr %ptr, i64 %val seq_cst, !noalias.addrspace !6
  ret i64 %ret
}
|
|
|
|
; Globals whose addresses feed the ptrtoint constant expressions in !6.
@gv0 = global i32 0
@gv1 = global i32 1
|
|
|
|
; Malformed !noalias.addrspace operands, one node per test function above.
; !0: no operands (used by @noalias_addrspace__empty).
!0 = !{}
; !1: a single operand (used by @noalias_addrspace__single_field).
!1 = !{i32 0}
; !2: two identical i32 operands (used by @noalias_addrspace__0_0).
!2 = !{i32 0, i32 0}
; !3: i64 operands instead of i32 (used by @noalias_addrspace__i64).
!3 = !{i64 1, i64 5}
; !4: floating-point operands (used by @noalias_addrspace__fp).
!4 = !{float 0.0, float 2.0}
; !5: pointer operands (used by @noalias_addrspace__ptr).
!5 = !{ptr null, ptr addrspace(1) null}
; !6: ptrtoint constant expressions (used by @noalias_addrspace__nonconstant).
!6 = !{i32 ptrtoint (ptr @gv0 to i32), i32 ptrtoint (ptr @gv1 to i32) }
|
|
|
|
|