
Now that #149310 has restricted lifetime intrinsics to only work on allocas, we can also drop the explicit size argument. Instead, the size is implied by the alloca. This removes the ability to only mark a prefix of an alloca alive/dead. We never used that capability, so we should remove the need to handle that possibility everywhere (though many key places, including stack coloring, did not actually respect this).
150 lines
7.4 KiB
LLVM
150 lines
7.4 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
|
; RUN: opt < %s -passes='sroa<preserve-cfg>' -S | FileCheck %s --check-prefixes=CHECK,CHECK-PRESERVE-CFG
|
|
; RUN: opt < %s -passes='sroa<modify-cfg>' -S | FileCheck %s --check-prefixes=CHECK,CHECK-MODIFY-CFG
|
|
; Data layout used by every test in this file. The parts the tests depend on:
;   - the trailing "A2" makes address space 2 the alloca address space;
;   - pointer widths differ per address space: 64 bits by default ("p:64"),
;     16 bits in address space 1 ("p1:16"), 32 bits in address spaces 2 and 3.
target datalayout = "e-p:64:64:64-p1:16:16:16-p2:32:32-p3:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-n8:16:32:64-A2"
|
|
|
|
; memcpy overloads for every destination/source combination of address spaces
; 1 and 2, all taking an i32 length. In the mangled name the first ".pN" is the
; destination pointer's address space and the second is the (readonly) source's.
declare void @llvm.memcpy.p2.p2.i32(ptr addrspace(2) nocapture, ptr addrspace(2) nocapture readonly, i32, i1)
|
|
declare void @llvm.memcpy.p1.p2.i32(ptr addrspace(1) nocapture, ptr addrspace(2) nocapture readonly, i32, i1)
|
|
declare void @llvm.memcpy.p2.p1.i32(ptr addrspace(2) nocapture, ptr addrspace(1) nocapture readonly, i32, i1)
|
|
declare void @llvm.memcpy.p1.p1.i32(ptr addrspace(1) nocapture, ptr addrspace(1) nocapture readonly, i32, i1)
|
|
|
|
|
|
; Copies 16 bytes from %a into a <2 x i64> alloca (address space 2) and then
; 16 bytes from that alloca into %b. Both %a and %b are in address space 1.
; The assertions expect the alloca and both memcpy calls to disappear, leaving
; one <2 x i64> load from %a and one store to %b, each keeping "align 2".
define void @test_address_space_1_1(ptr addrspace(1) %a, ptr addrspace(1) %b) {
|
|
; CHECK-LABEL: @test_address_space_1_1(
|
|
; CHECK-NEXT: [[AA_0_COPYLOAD:%.*]] = load <2 x i64>, ptr addrspace(1) [[A:%.*]], align 2
|
|
; CHECK-NEXT: store <2 x i64> [[AA_0_COPYLOAD]], ptr addrspace(1) [[B:%.*]], align 2
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%aa = alloca <2 x i64>, align 16, addrspace(2)
|
|
; Fill the whole alloca from %a (addrspace 1 -> addrspace 2).
call void @llvm.memcpy.p2.p1.i32(ptr addrspace(2) align 2 %aa, ptr addrspace(1) align 2 %a, i32 16, i1 false)
|
|
; Copy the whole alloca out to %b (addrspace 2 -> addrspace 1).
call void @llvm.memcpy.p1.p2.i32(ptr addrspace(1) align 2 %b, ptr addrspace(2) align 2 %aa, i32 16, i1 false)
|
|
ret void
|
|
}
|
|
|
|
; Same shape as the 16-byte copy-in/copy-out pattern, but here the source %a is
; in address space 1 and the destination %b is in address space 2 (the same
; address space as the alloca). The assertions expect a single <2 x i64> load
; from %a and a single store to %b, with no alloca or memcpy left.
define void @test_address_space_1_0(ptr addrspace(1) %a, ptr addrspace(2) %b) {
|
|
; CHECK-LABEL: @test_address_space_1_0(
|
|
; CHECK-NEXT: [[AA_0_COPYLOAD:%.*]] = load <2 x i64>, ptr addrspace(1) [[A:%.*]], align 2
|
|
; CHECK-NEXT: store <2 x i64> [[AA_0_COPYLOAD]], ptr addrspace(2) [[B:%.*]], align 2
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%aa = alloca <2 x i64>, align 16, addrspace(2)
|
|
; Fill the whole alloca from %a (addrspace 1 -> addrspace 2).
call void @llvm.memcpy.p2.p1.i32(ptr addrspace(2) align 2 %aa, ptr addrspace(1) align 2 %a, i32 16, i1 false)
|
|
; Copy the whole alloca out to %b (addrspace 2 -> addrspace 2).
call void @llvm.memcpy.p2.p2.i32(ptr addrspace(2) align 2 %b, ptr addrspace(2) align 2 %aa, i32 16, i1 false)
|
|
ret void
|
|
}
|
|
|
|
; Same 16-byte copy-in/copy-out pattern with the address spaces swapped: the
; source %a is in address space 2 (same as the alloca) and the destination %b
; is in address space 1. The assertions expect a single <2 x i64> load from %a
; and a single store to %b, with no alloca or memcpy left.
define void @test_address_space_0_1(ptr addrspace(2) %a, ptr addrspace(1) %b) {
|
|
; CHECK-LABEL: @test_address_space_0_1(
|
|
; CHECK-NEXT: [[AA_0_COPYLOAD:%.*]] = load <2 x i64>, ptr addrspace(2) [[A:%.*]], align 2
|
|
; CHECK-NEXT: store <2 x i64> [[AA_0_COPYLOAD]], ptr addrspace(1) [[B:%.*]], align 2
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%aa = alloca <2 x i64>, align 16, addrspace(2)
|
|
; Fill the whole alloca from %a (addrspace 2 -> addrspace 2).
call void @llvm.memcpy.p2.p2.i32(ptr addrspace(2) align 2 %aa, ptr addrspace(2) align 2 %a, i32 16, i1 false)
|
|
; Copy the whole alloca out to %b (addrspace 2 -> addrspace 1).
call void @llvm.memcpy.p1.p2.i32(ptr addrspace(1) align 2 %b, ptr addrspace(2) align 2 %aa, i32 16, i1 false)
|
|
ret void
|
|
}
|
|
|
|
; Aggregate used as the alloca type in @copy_struct; that test copies out of
; the trailing [4 x i32] member (field index 4).
%struct.struct_test_27.0.13 = type { i32, float, i64, i8, [4 x i32] }
|
|
|
|
; Stores the by-value [5 x i64] argument over a struct alloca in address
; space 2, then memcpy's 16 bytes starting at the struct's [4 x i32] member to
; %ptr in address space 1.
; The assertions expect no alloca or memcpy in the output. Instead the copied
; bytes are rebuilt from the argument with extractvalue: the upper 32 bits of
; element 2 go to %ptr, element 3 goes to byte offset 4, and an undef i32 goes
; to byte offset 12. The generated GEPs into %ptr use i16 offsets.
define void @copy_struct([5 x i64] %in.coerce, ptr addrspace(1) align 4 %ptr) {
|
|
; CHECK-LABEL: @copy_struct(
|
|
; CHECK-NEXT: for.end:
|
|
; CHECK-NEXT: [[IN_COERCE_FCA_0_EXTRACT:%.*]] = extractvalue [5 x i64] [[IN_COERCE:%.*]], 0
|
|
; CHECK-NEXT: [[IN_COERCE_FCA_1_EXTRACT:%.*]] = extractvalue [5 x i64] [[IN_COERCE]], 1
|
|
; CHECK-NEXT: [[IN_COERCE_FCA_2_EXTRACT:%.*]] = extractvalue [5 x i64] [[IN_COERCE]], 2
|
|
; CHECK-NEXT: [[IN_COERCE_FCA_3_EXTRACT:%.*]] = extractvalue [5 x i64] [[IN_COERCE]], 3
|
|
; CHECK-NEXT: [[IN_SROA_2_4_EXTRACT_SHIFT:%.*]] = lshr i64 [[IN_COERCE_FCA_2_EXTRACT]], 32
|
|
; CHECK-NEXT: [[IN_SROA_2_4_EXTRACT_TRUNC:%.*]] = trunc i64 [[IN_SROA_2_4_EXTRACT_SHIFT]] to i32
|
|
; CHECK-NEXT: store i32 [[IN_SROA_2_4_EXTRACT_TRUNC]], ptr addrspace(1) [[PTR:%.*]], align 4
|
|
; CHECK-NEXT: [[IN_SROA_4_20_PTR_SROA_IDX:%.*]] = getelementptr inbounds i8, ptr addrspace(1) [[PTR]], i16 4
|
|
; CHECK-NEXT: store i64 [[IN_COERCE_FCA_3_EXTRACT]], ptr addrspace(1) [[IN_SROA_4_20_PTR_SROA_IDX]], align 4
|
|
; CHECK-NEXT: [[IN_SROA_5_20_PTR_SROA_IDX:%.*]] = getelementptr inbounds i8, ptr addrspace(1) [[PTR]], i16 12
|
|
; CHECK-NEXT: store i32 undef, ptr addrspace(1) [[IN_SROA_5_20_PTR_SROA_IDX]], align 4
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
for.end:
|
|
%in = alloca %struct.struct_test_27.0.13, align 8, addrspace(2)
|
|
; The stored type ([5 x i64]) differs from the alloca's declared struct type.
store [5 x i64] %in.coerce, ptr addrspace(2) %in, align 8
|
|
; Address of element 0 of the struct's [4 x i32] member (field index 4).
%scevgep9 = getelementptr %struct.struct_test_27.0.13, ptr addrspace(2) %in, i32 0, i32 4, i32 0
|
|
call void @llvm.memcpy.p1.p2.i32(ptr addrspace(1) align 4 %ptr, ptr addrspace(2) align 4 %scevgep9, i32 16, i1 false)
|
|
ret void
|
|
}
|
|
|
|
; Single-pointer aggregate used as the alloca type in @pr27557 and
; @pr27557.alt, plus two globals stored through it by @pr27557: @g is in the
; default address space and @l is in address space 3.
%union.anon = type { ptr }
|
|
|
|
@g = common global i32 0, align 4
|
|
@l = common addrspace(3) global i32 0, align 4
|
|
|
|
; If pointers from different address spaces have different sizes, make sure an
|
|
; illegal bitcast isn't introduced
|
|
; Stores a default-address-space pointer (@g) and then an addrspace(3) pointer
; (@l) to the same single-pointer alloca. The data layout gives these pointer
; kinds different widths (64 vs 32 bits).
; The assertions expect the alloca to survive, retyped as "alloca ptr" in
; address space 2, with both stores kept as written and no cast between the
; two pointer types.
define void @pr27557() {
|
|
; CHECK-LABEL: @pr27557(
|
|
; CHECK-NEXT: [[DOTSROA_0:%.*]] = alloca ptr, align 8, addrspace(2)
|
|
; CHECK-NEXT: store ptr @g, ptr addrspace(2) [[DOTSROA_0]], align 8
|
|
; CHECK-NEXT: store ptr addrspace(3) @l, ptr addrspace(2) [[DOTSROA_0]], align 8
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%1 = alloca %union.anon, align 8, addrspace(2)
|
|
store ptr @g, ptr addrspace(2) %1, align 8
|
|
store ptr addrspace(3) @l, ptr addrspace(2) %1, align 8
|
|
ret void
|
|
}
|
|
|
|
; Global in address space 4, which the datalayout string does not list
; explicitly; used by @pr27557.alt.
@l4 = common addrspace(4) global i32 0, align 4
|
|
|
|
; If pointers from different address spaces have the same size, that pointer
|
|
; should be promoted through the pair of `ptrtoint`/`inttoptr`.
|
|
; Stores an addrspace(4) pointer (@l4) into a single-pointer alloca and reloads
; it as a default-address-space pointer, which is then returned.
; The assertions expect the alloca, store and load to be removed entirely: the
; function returns a constant that converts @l4 to i64 with ptrtoint and back
; to a default-address-space pointer with inttoptr.
define ptr @pr27557.alt() {
|
|
; CHECK-LABEL: @pr27557.alt(
|
|
; CHECK-NEXT: ret ptr inttoptr (i64 ptrtoint (ptr addrspace(4) @l4 to i64) to ptr)
|
|
;
|
|
%1 = alloca %union.anon, align 8, addrspace(2)
|
|
store ptr addrspace(4) @l4, ptr addrspace(2) %1, align 8
|
|
; Reload the same slot with a different pointer type than was stored.
%2 = load ptr, ptr addrspace(2) %1, align 8
|
|
ret ptr %2
|
|
}
|
|
|
|
; Test load from and store to non-zero address space.
|
|
; Loads an i64 from %complex1 (address space 1) into an address-space-2 alloca,
; reads the alloca back as two floats (element 0 and element 1 of a
; [2 x float] view), adds them, writes the sum to both float slots, then
; reloads the alloca as an i64 and stores it to %complex2 (address space 1).
; The assertions expect the alloca to be eliminated: the i64 load becomes two
; i32 loads from %complex1 (byte offsets 0 and 4), each bitcast to float; the
; fadd result is bitcast back to i32 twice and written with two i32 stores to
; %complex2 (byte offsets 0 and 4). The generated GEPs use i16 offsets.
define void @test_load_store_diff_addr_space(ptr addrspace(1) %complex1, ptr addrspace(1) %complex2) {
|
|
; CHECK-LABEL: @test_load_store_diff_addr_space(
|
|
; CHECK-NEXT: [[V13:%.*]] = load i32, ptr addrspace(1) [[COMPLEX1:%.*]], align 4
|
|
; CHECK-NEXT: [[COMPLEX1_SROA_IDX:%.*]] = getelementptr inbounds i8, ptr addrspace(1) [[COMPLEX1]], i16 4
|
|
; CHECK-NEXT: [[V14:%.*]] = load i32, ptr addrspace(1) [[COMPLEX1_SROA_IDX]], align 4
|
|
; CHECK-NEXT: [[TMP1:%.*]] = bitcast i32 [[V13]] to float
|
|
; CHECK-NEXT: [[TMP2:%.*]] = bitcast i32 [[V14]] to float
|
|
; CHECK-NEXT: [[SUM:%.*]] = fadd float [[TMP1]], [[TMP2]]
|
|
; CHECK-NEXT: [[TMP3:%.*]] = bitcast float [[SUM]] to i32
|
|
; CHECK-NEXT: [[TMP4:%.*]] = bitcast float [[SUM]] to i32
|
|
; CHECK-NEXT: store i32 [[TMP3]], ptr addrspace(1) [[COMPLEX2:%.*]], align 4
|
|
; CHECK-NEXT: [[COMPLEX2_SROA_IDX:%.*]] = getelementptr inbounds i8, ptr addrspace(1) [[COMPLEX2]], i16 4
|
|
; CHECK-NEXT: store i32 [[TMP4]], ptr addrspace(1) [[COMPLEX2_SROA_IDX]], align 4
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%a0 = alloca [2 x i64], align 8, addrspace(2)
|
|
; Second float of the alloca when it is viewed as [2 x float].
%a.gep2 = getelementptr [2 x float], ptr addrspace(2) %a0, i32 0, i32 1
|
|
%v1 = load i64, ptr addrspace(1) %complex1
|
|
store i64 %v1, ptr addrspace(2) %a0
|
|
%f1 = load float, ptr addrspace(2) %a0
|
|
%f2 = load float, ptr addrspace(2) %a.gep2
|
|
%sum = fadd float %f1, %f2
|
|
; The same sum is written to both float slots.
store float %sum, ptr addrspace(2) %a0
|
|
store float %sum, ptr addrspace(2) %a.gep2
|
|
%v2 = load i64, ptr addrspace(2) %a0
|
|
store i64 %v2, ptr addrspace(1) %complex2
|
|
ret void
|
|
}
|
|
|
|
; An alloca in address space 2 whose only use is a lifetime.start marker. The
; marker takes just the alloca pointer, with no size argument.
; The assertions expect both the alloca and the marker to be removed, leaving
; only "ret void".
define void @addressspace_alloca_lifetime() {
|
|
; CHECK-LABEL: @addressspace_alloca_lifetime(
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
%alloca = alloca i8, align 8, addrspace(2)
|
|
call void @llvm.lifetime.start(ptr addrspace(2) %alloca)
|
|
ret void
|
|
}
|
|
|
|
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
|
|
; CHECK-MODIFY-CFG: {{.*}}
|
|
; CHECK-PRESERVE-CFG: {{.*}}
|