
Set the writable and dead_on_unwind attributes for sret arguments. These indicate that the argument points to writable memory (and it's legal to introduce spurious writes to it on entry to the function) and that the argument memory will not be used if the call unwinds. This enables additional MemCpyOpt/DSE/LICM optimizations.
167 lines
8.3 KiB
C
167 lines
8.3 KiB
C
// RUN: %clang_cc1 -msoft-float -mfloat-abi soft -triple powerpc64le-unknown-linux-gnu -emit-llvm -o - %s | FileCheck -check-prefix=CHECK -check-prefix=CHECK-LE %s
|
|
// RUN: %clang_cc1 -msoft-float -mfloat-abi soft -triple powerpc64-unknown-linux-gnu -emit-llvm -o - %s | FileCheck -check-prefix=CHECK -check-prefix=CHECK-BE %s
|
|
|
|
// Test float returns and params.
|
|
|
|
// CHECK: define{{.*}} float @func_p1(float noundef %x)
|
|
float func_p1(float x) { return x; }
|
|
|
|
// CHECK: define{{.*}} double @func_p2(double noundef %x)
|
|
double func_p2(double x) { return x; }
|
|
|
|
// CHECK: define{{.*}} ppc_fp128 @func_p3(ppc_fp128 noundef %x)
|
|
long double func_p3(long double x) { return x; }
|
|
|
|
// Test homogeneous float aggregate passing and returning.
|
|
|
|
struct f1 { float f[1]; };
|
|
struct f2 { float f[2]; };
|
|
struct f3 { float f[3]; };
|
|
struct f4 { float f[4]; };
|
|
struct f5 { float f[5]; };
|
|
struct f6 { float f[6]; };
|
|
struct f7 { float f[7]; };
|
|
struct f8 { float f[8]; };
|
|
struct f9 { float f[9]; };
|
|
|
|
struct fab { float a; float b; };
|
|
struct fabc { float a; float b; float c; };
|
|
|
|
struct f2a2b { float a[2]; float b[2]; };
|
|
|
|
// CHECK-LE: define{{.*}} i32 @func_f1(float inreg %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_f1(ptr dead_on_unwind noalias writable sret(%struct.f1) align 4 %agg.result, float inreg %x.coerce)
|
|
struct f1 func_f1(struct f1 x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} i64 @func_f2(i64 %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_f2(ptr dead_on_unwind noalias writable sret(%struct.f2) align 4 %agg.result, i64 %x.coerce)
|
|
struct f2 func_f2(struct f2 x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} { i64, i64 } @func_f3([2 x i64] %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_f3(ptr dead_on_unwind noalias writable sret(%struct.f3) align 4 %agg.result, [2 x i64] %x.coerce)
|
|
struct f3 func_f3(struct f3 x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} { i64, i64 } @func_f4([2 x i64] %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_f4(ptr dead_on_unwind noalias writable sret(%struct.f4) align 4 %agg.result, [2 x i64] %x.coerce)
|
|
struct f4 func_f4(struct f4 x) { return x; }
|
|
|
|
// CHECK: define{{.*}} void @func_f5(ptr dead_on_unwind noalias writable sret(%struct.f5) align 4 %agg.result, [3 x i64] %x.coerce)
|
|
struct f5 func_f5(struct f5 x) { return x; }
|
|
|
|
// CHECK: define{{.*}} void @func_f6(ptr dead_on_unwind noalias writable sret(%struct.f6) align 4 %agg.result, [3 x i64] %x.coerce)
|
|
struct f6 func_f6(struct f6 x) { return x; }
|
|
|
|
// CHECK: define{{.*}} void @func_f7(ptr dead_on_unwind noalias writable sret(%struct.f7) align 4 %agg.result, [4 x i64] %x.coerce)
|
|
struct f7 func_f7(struct f7 x) { return x; }
|
|
|
|
// CHECK: define{{.*}} void @func_f8(ptr dead_on_unwind noalias writable sret(%struct.f8) align 4 %agg.result, [4 x i64] %x.coerce)
|
|
struct f8 func_f8(struct f8 x) { return x; }
|
|
|
|
// CHECK: define{{.*}} void @func_f9(ptr dead_on_unwind noalias writable sret(%struct.f9) align 4 %agg.result, [5 x i64] %x.coerce)
|
|
struct f9 func_f9(struct f9 x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} i64 @func_fab(i64 %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_fab(ptr dead_on_unwind noalias writable sret(%struct.fab) align 4 %agg.result, i64 %x.coerce)
|
|
struct fab func_fab(struct fab x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} { i64, i64 } @func_fabc([2 x i64] %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_fabc(ptr dead_on_unwind noalias writable sret(%struct.fabc) align 4 %agg.result, [2 x i64] %x.coerce)
|
|
struct fabc func_fabc(struct fabc x) { return x; }
|
|
|
|
// CHECK-LE: define{{.*}} { i64, i64 } @func_f2a2b([2 x i64] %x.coerce)
|
|
// CHECK-BE: define{{.*}} void @func_f2a2b(ptr dead_on_unwind noalias writable sret(%struct.f2a2b) align 4 %agg.result, [2 x i64] %x.coerce)
|
|
struct f2a2b func_f2a2b(struct f2a2b x) { return x; }
|
|
|
|
// CHECK-LABEL: @call_f1
|
|
// CHECK-BE: %[[TMP0:[^ ]+]] = alloca %struct.f1, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load float, ptr @global_f1, align 4
|
|
// CHECK-LE: call i32 @func_f1(float inreg %[[TMP]])
|
|
// CHECK-BE: call void @func_f1(ptr dead_on_unwind writable sret(%struct.f1) align 4 %[[TMP0]], float inreg %[[TMP]])
|
|
struct f1 global_f1;
|
|
void call_f1(void) { global_f1 = func_f1(global_f1); }
|
|
|
|
// CHECK-LABEL: @call_f2
|
|
// CHECK-BE: %[[TMP0:[^ ]+]] = alloca %struct.f2, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load i64, ptr @global_f2, align 4
|
|
// CHECK-LE: call i64 @func_f2(i64 %[[TMP]])
|
|
// CHECK-BE: call void @func_f2(ptr dead_on_unwind writable sret(%struct.f2) align 4 %[[TMP0]], i64 %[[TMP]])
|
|
struct f2 global_f2;
|
|
void call_f2(void) { global_f2 = func_f2(global_f2); }
|
|
|
|
// CHECK-LABEL: @call_f3
|
|
// CHECK-BE: %[[TMP0:[^ ]+]] = alloca %struct.f3, align 4
|
|
// CHECK: %[[TMP1:[^ ]+]] = alloca [2 x i64]
|
|
// CHECK: call void @llvm.memcpy.p0.p0.i64(ptr align 8 %[[TMP1]], ptr align 4 @global_f3, i64 12, i1 false)
|
|
// CHECK: %[[TMP3:[^ ]+]] = load [2 x i64], ptr %[[TMP1]]
|
|
// CHECK-LE: call { i64, i64 } @func_f3([2 x i64] %[[TMP3]])
|
|
// CHECK-BE: call void @func_f3(ptr dead_on_unwind writable sret(%struct.f3) align 4 %[[TMP0]], [2 x i64] %[[TMP3]])
|
|
struct f3 global_f3;
|
|
void call_f3(void) { global_f3 = func_f3(global_f3); }
|
|
|
|
// CHECK-LABEL: @call_f4
|
|
// CHECK-BE: %[[TMP0:[^ ]+]] = alloca %struct.f4, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load [2 x i64], ptr @global_f4, align 4
|
|
// CHECK-LE: call { i64, i64 } @func_f4([2 x i64] %[[TMP]])
|
|
// CHECK-BE: call void @func_f4(ptr dead_on_unwind writable sret(%struct.f4) align 4 %[[TMP0]], [2 x i64] %[[TMP]])
|
|
struct f4 global_f4;
|
|
void call_f4(void) { global_f4 = func_f4(global_f4); }
|
|
|
|
// CHECK-LABEL: @call_f5
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca %struct.f5, align 4
|
|
// CHECK: %[[TMP1:[^ ]+]] = alloca [3 x i64]
|
|
// CHECK: call void @llvm.memcpy.p0.p0.i64(ptr align 8 %[[TMP1]], ptr align 4 @global_f5, i64 20, i1 false)
|
|
// CHECK: %[[TMP3:[^ ]+]] = load [3 x i64], ptr %[[TMP1]]
|
|
// CHECK: call void @func_f5(ptr dead_on_unwind writable sret(%struct.f5) align 4 %[[TMP0]], [3 x i64] %[[TMP3]])
|
|
struct f5 global_f5;
|
|
void call_f5(void) { global_f5 = func_f5(global_f5); }
|
|
|
|
// CHECK-LABEL: @call_f6
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca %struct.f6, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load [3 x i64], ptr @global_f6, align 4
|
|
// CHECK: call void @func_f6(ptr dead_on_unwind writable sret(%struct.f6) align 4 %[[TMP0]], [3 x i64] %[[TMP]])
|
|
struct f6 global_f6;
|
|
void call_f6(void) { global_f6 = func_f6(global_f6); }
|
|
|
|
// CHECK-LABEL: @call_f7
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca %struct.f7, align 4
|
|
// CHECK: %[[TMP1:[^ ]+]] = alloca [4 x i64], align 8
|
|
// CHECK: call void @llvm.memcpy.p0.p0.i64(ptr align 8 %[[TMP1]], ptr align 4 @global_f7, i64 28, i1 false)
|
|
// CHECK: %[[TMP3:[^ ]+]] = load [4 x i64], ptr %[[TMP1]], align 8
|
|
// CHECK: call void @func_f7(ptr dead_on_unwind writable sret(%struct.f7) align 4 %[[TMP0]], [4 x i64] %[[TMP3]])
|
|
struct f7 global_f7;
|
|
void call_f7(void) { global_f7 = func_f7(global_f7); }
|
|
|
|
// CHECK-LABEL: @call_f8
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca %struct.f8, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load [4 x i64], ptr @global_f8, align 4
|
|
// CHECK: call void @func_f8(ptr dead_on_unwind writable sret(%struct.f8) align 4 %[[TMP0]], [4 x i64] %[[TMP]])
|
|
struct f8 global_f8;
|
|
void call_f8(void) { global_f8 = func_f8(global_f8); }
|
|
|
|
// CHECK-LABEL: @call_f9
|
|
// CHECK: %[[TMP1:[^ ]+]] = alloca [5 x i64]
|
|
// CHECK: call void @llvm.memcpy.p0.p0.i64(ptr align 8 %[[TMP1]], ptr align 4 @global_f9, i64 36, i1 false)
|
|
// CHECK: %[[TMP3:[^ ]+]] = load [5 x i64], ptr %[[TMP1]]
|
|
// CHECK: call void @func_f9(ptr dead_on_unwind writable sret(%struct.f9) align 4 %{{[^ ]+}}, [5 x i64] %[[TMP3]])
|
|
struct f9 global_f9;
|
|
void call_f9(void) { global_f9 = func_f9(global_f9); }
|
|
|
|
// CHECK-LABEL: @call_fab
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca %struct.fab, align 4
|
|
// CHECK: %[[TMP:[^ ]+]] = load i64, ptr @global_fab, align 4
|
|
// CHECK-LE: %call = call i64 @func_fab(i64 %[[TMP]])
|
|
// CHECK-BE: call void @func_fab(ptr dead_on_unwind writable sret(%struct.fab) align 4 %[[TMP0]], i64 %[[TMP]])
|
|
struct fab global_fab;
|
|
void call_fab(void) { global_fab = func_fab(global_fab); }
|
|
|
|
// CHECK-LABEL: @call_fabc
|
|
// CHECK-BE: %[[TMPX:[^ ]+]] = alloca %struct.fabc, align 4
|
|
// CHECK: %[[TMP0:[^ ]+]] = alloca [2 x i64], align 8
|
|
// CHECK: call void @llvm.memcpy.p0.p0.i64(ptr align 8 %[[TMP0]], ptr align 4 @global_fabc, i64 12, i1 false)
|
|
// CHECK: %[[TMP3:[^ ]+]] = load [2 x i64], ptr %[[TMP0]], align 8
|
|
// CHECK-LE: %call = call { i64, i64 } @func_fabc([2 x i64] %[[TMP3]])
|
|
// CHECK-BE: call void @func_fabc(ptr dead_on_unwind writable sret(%struct.fabc) align 4 %[[TMPX]], [2 x i64] %[[TMP3]])
|
|
struct fabc global_fabc;
|
|
void call_fabc(void) { global_fabc = func_fabc(global_fabc); }
|
|
|