[AMDGPU] Remove explicit datalayout from tests where not needed
Since e39f6c1844fab59c638d8059a6cf139adb42279a opt will infer the correct datalayout when given a triple. Avoid explicitly specifying it in tests that depend on the AMDGPU target being present to avoid the string becoming out of sync with the TargetInfo value. Only tests with REQUIRES: amdgpu-registered-target or a local lit.cfg were updated to ensure that tests for non-target-specific passes that happen to use the AMDGPU layout still pass when building with a limited set of targets. Reviewed By: shiltian, arsenm Pull Request: https://github.com/llvm/llvm-project/pull/137921
This commit is contained in:
parent
c02496901d
commit
ee13638362
@ -6,7 +6,6 @@
|
|||||||
; RUN: -disable-output %s 2>&1 | \
|
; RUN: -disable-output %s 2>&1 | \
|
||||||
; RUN: FileCheck -match-full-lines %s
|
; RUN: FileCheck -match-full-lines %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; CHECK: remark: test.c:10:0: in artificial function 'all', omp_target_num_teams = 100
|
; CHECK: remark: test.c:10:0: in artificial function 'all', omp_target_num_teams = 100
|
||||||
|
@ -81,7 +81,6 @@
|
|||||||
|
|
||||||
; ModuleID = 'test-openmp-amdgcn-amd-amdhsa-gfx906.bc'
|
; ModuleID = 'test-openmp-amdgcn-amd-amdhsa-gfx906.bc'
|
||||||
source_filename = "test.c"
|
source_filename = "test.c"
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
%struct.ident_t = type { i32, i32, i32, i32, ptr }
|
%struct.ident_t = type { i32, i32, i32, i32, ptr }
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
||||||
; Nothing should be done if the addrspacecast is captured.
|
; Nothing should be done if the addrspacecast is captured.
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
declare void @consume_ptr2int(i32) #0
|
declare void @consume_ptr2int(i32) #0
|
||||||
|
|
||||||
; CHECK-LABEL: @addrspacecast_captured(
|
; CHECK-LABEL: @addrspacecast_captured(
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4ceilf(float)
|
declare float @_Z4ceilf(float)
|
||||||
declare <2 x float> @_Z4ceilDv2_f(<2 x float>)
|
declare <2 x float> @_Z4ceilDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4ceilDv3_f(<3 x float>)
|
declare <3 x float> @_Z4ceilDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z8copysignff(float, float)
|
declare float @_Z8copysignff(float, float)
|
||||||
declare <2 x float> @_Z8copysignDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z8copysignDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z8copysignDv3_fS_(<3 x float>, <3 x float>)
|
declare <3 x float> @_Z8copysignDv3_fS_(<3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3expf(float)
|
declare float @_Z3expf(float)
|
||||||
declare <2 x float> @_Z3expDv2_f(<2 x float>)
|
declare <2 x float> @_Z3expDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z3expDv3_f(<3 x float>)
|
declare <3 x float> @_Z3expDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4exp2f(float)
|
declare float @_Z4exp2f(float)
|
||||||
declare <2 x float> @_Z4exp2Dv2_f(<2 x float>)
|
declare <2 x float> @_Z4exp2Dv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4exp2Dv3_f(<3 x float>)
|
declare <3 x float> @_Z4exp2Dv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4fabsf(float)
|
declare float @_Z4fabsf(float)
|
||||||
declare <2 x float> @_Z4fabsDv2_f(<2 x float>)
|
declare <2 x float> @_Z4fabsDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4fabsDv3_f(<3 x float>)
|
declare <3 x float> @_Z4fabsDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5floorf(float)
|
declare float @_Z5floorf(float)
|
||||||
declare <2 x float> @_Z5floorDv2_f(<2 x float>)
|
declare <2 x float> @_Z5floorDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z5floorDv3_f(<3 x float>)
|
declare <3 x float> @_Z5floorDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3fmafff(float, float, float)
|
declare float @_Z3fmafff(float, float, float)
|
||||||
declare <2 x float> @_Z3fmaDv2_fS_S_(<2 x float>, <2 x float>, <2 x float>)
|
declare <2 x float> @_Z3fmaDv2_fS_S_(<2 x float>, <2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z3fmaDv3_fS_S_(<3 x float>, <3 x float>, <3 x float>)
|
declare <3 x float> @_Z3fmaDv3_fS_S_(<3 x float>, <3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare <2 x float> @_Z4fmaxDv2_ff(<2 x float>, float)
|
declare <2 x float> @_Z4fmaxDv2_ff(<2 x float>, float)
|
||||||
declare <2 x float> @_Z4fmaxDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z4fmaxDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z4fmaxDv3_ff(<3 x float>, float)
|
declare <3 x float> @_Z4fmaxDv3_ff(<3 x float>, float)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4fmaxff(float, float)
|
declare float @_Z4fmaxff(float, float)
|
||||||
declare <2 x float> @_Z4fmaxDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z4fmaxDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z4fmaxDv3_fS_(<3 x float>, <3 x float>)
|
declare <3 x float> @_Z4fmaxDv3_fS_(<3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare <2 x float> @_Z4fminDv2_ff(<2 x float>, float)
|
declare <2 x float> @_Z4fminDv2_ff(<2 x float>, float)
|
||||||
declare <2 x float> @_Z4fminDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z4fminDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z4fminDv3_ff(<3 x float>, float)
|
declare <3 x float> @_Z4fminDv3_ff(<3 x float>, float)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4fminff(float, float)
|
declare float @_Z4fminff(float, float)
|
||||||
declare <2 x float> @_Z4fminDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z4fminDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z4fminDv3_fS_(<3 x float>, <3 x float>)
|
declare <3 x float> @_Z4fminDv3_fS_(<3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare <2 x float> @_Z5ldexpDv2_fi(<2 x float>, i32)
|
declare <2 x float> @_Z5ldexpDv2_fi(<2 x float>, i32)
|
||||||
declare <3 x float> @_Z5ldexpDv3_fi(<3 x float>, i32)
|
declare <3 x float> @_Z5ldexpDv3_fi(<3 x float>, i32)
|
||||||
declare <4 x float> @_Z5ldexpDv4_fi(<4 x float>, i32)
|
declare <4 x float> @_Z5ldexpDv4_fi(<4 x float>, i32)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5ldexpfi(float, i32)
|
declare float @_Z5ldexpfi(float, i32)
|
||||||
declare <2 x float> @_Z5ldexpDv2_fDv2_i(<2 x float>, <2 x i32>)
|
declare <2 x float> @_Z5ldexpDv2_fDv2_i(<2 x float>, <2 x i32>)
|
||||||
declare <3 x float> @_Z5ldexpDv3_fDv3_i(<3 x float>, <3 x i32>)
|
declare <3 x float> @_Z5ldexpDv3_fDv3_i(<3 x float>, <3 x i32>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3logf(float)
|
declare float @_Z3logf(float)
|
||||||
declare <2 x float> @_Z3logDv2_f(<2 x float>)
|
declare <2 x float> @_Z3logDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z3logDv3_f(<3 x float>)
|
declare <3 x float> @_Z3logDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5log10f(float)
|
declare float @_Z5log10f(float)
|
||||||
declare <2 x float> @_Z5log10Dv2_f(<2 x float>)
|
declare <2 x float> @_Z5log10Dv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z5log10Dv3_f(<3 x float>)
|
declare <3 x float> @_Z5log10Dv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4log2f(float)
|
declare float @_Z4log2f(float)
|
||||||
declare <2 x float> @_Z4log2Dv2_f(<2 x float>)
|
declare <2 x float> @_Z4log2Dv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4log2Dv3_f(<3 x float>)
|
declare <3 x float> @_Z4log2Dv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3madfff(float, float, float)
|
declare float @_Z3madfff(float, float, float)
|
||||||
declare <2 x float> @_Z3madDv2_fS_S_(<2 x float>, <2 x float>, <2 x float>)
|
declare <2 x float> @_Z3madDv2_fS_S_(<2 x float>, <2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z3madDv3_fS_S_(<3 x float>, <3 x float>, <3 x float>)
|
declare <3 x float> @_Z3madDv3_fS_S_(<3 x float>, <3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3powff(float, float)
|
declare float @_Z3powff(float, float)
|
||||||
declare <2 x float> @_Z3powDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z3powDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z3powDv3_fS_(<3 x float>, <3 x float>)
|
declare <3 x float> @_Z3powDv3_fS_(<3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4pownfi(float, i32)
|
declare float @_Z4pownfi(float, i32)
|
||||||
declare <2 x float> @_Z4pownDv2_fDv2_i(<2 x float>, <2 x i32>)
|
declare <2 x float> @_Z4pownDv2_fDv2_i(<2 x float>, <2 x i32>)
|
||||||
declare <3 x float> @_Z4pownDv3_fDv3_i(<3 x float>, <3 x i32>)
|
declare <3 x float> @_Z4pownDv3_fDv3_i(<3 x float>, <3 x i32>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4powrff(float, float)
|
declare float @_Z4powrff(float, float)
|
||||||
declare <2 x float> @_Z4powrDv2_fS_(<2 x float>, <2 x float>)
|
declare <2 x float> @_Z4powrDv2_fS_(<2 x float>, <2 x float>)
|
||||||
declare <3 x float> @_Z4powrDv3_fS_(<3 x float>, <3 x float>)
|
declare <3 x float> @_Z4powrDv3_fS_(<3 x float>, <3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4rintf(float)
|
declare float @_Z4rintf(float)
|
||||||
declare <2 x float> @_Z4rintDv2_f(<2 x float>)
|
declare <2 x float> @_Z4rintDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4rintDv3_f(<3 x float>)
|
declare <3 x float> @_Z4rintDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals all --version 4
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals all --version 4
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib,instcombine -amdgpu-prelink %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5rootnfi(float, i32)
|
declare float @_Z5rootnfi(float, i32)
|
||||||
declare <2 x float> @_Z5rootnDv2_fDv2_i(<2 x float>, <2 x i32>)
|
declare <2 x float> @_Z5rootnDv2_fDv2_i(<2 x float>, <2 x i32>)
|
||||||
declare <3 x float> @_Z5rootnDv3_fDv3_i(<3 x float>, <3 x i32>)
|
declare <3 x float> @_Z5rootnDv3_fDv3_i(<3 x float>, <3 x i32>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5roundf(float)
|
declare float @_Z5roundf(float)
|
||||||
declare <2 x float> @_Z5roundDv2_f(<2 x float>)
|
declare <2 x float> @_Z5roundDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z5roundDv3_f(<3 x float>)
|
declare <3 x float> @_Z5roundDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
; sin, cos, and sincos are already defined in the module.
|
; sin, cos, and sincos are already defined in the module.
|
||||||
|
|
||||||
define float @_Z3sinf(float %x) {
|
define float @_Z3sinf(float %x) {
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
; sin and cos are already defined in the module but sincos isn't.
|
; sin and cos are already defined in the module but sincos isn't.
|
||||||
|
|
||||||
define float @_Z3sinf(float noundef %x) {
|
define float @_Z3sinf(float noundef %x) {
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -O1 -mtriple=amdgcn-- -amdgpu-simplify-libcall=1 -amdgpu-prelink < %s | FileCheck %s
|
; RUN: opt -S -O1 -mtriple=amdgcn-- -amdgpu-simplify-libcall=1 -amdgpu-prelink < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3sinf(float) #0
|
declare float @_Z3sinf(float) #0
|
||||||
declare float @_Z3cosf(float) #0
|
declare float @_Z3cosf(float) #0
|
||||||
declare <2 x float> @_Z3sinDv2_f(<2 x float>) #0
|
declare <2 x float> @_Z3sinDv2_f(<2 x float>) #0
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-attributes --check-globals --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-attributes --check-globals --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib -amdgpu-prelink < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib -amdgpu-prelink < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z3sinf(float noundef)
|
declare float @_Z3sinf(float noundef)
|
||||||
declare float @_Z3cosf(float noundef)
|
declare float @_Z3cosf(float noundef)
|
||||||
declare <2 x float> @_Z3sinDv2_f(<2 x float> noundef)
|
declare <2 x float> @_Z3sinDv2_f(<2 x float> noundef)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes=amdgpu-simplifylib < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare extern_weak float @_Z3sinf(float noundef)
|
declare extern_weak float @_Z3sinf(float noundef)
|
||||||
declare extern_weak float @_Z3cosf(float noundef)
|
declare extern_weak float @_Z3cosf(float noundef)
|
||||||
|
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z4sqrtf(float)
|
declare float @_Z4sqrtf(float)
|
||||||
declare <2 x float> @_Z4sqrtDv2_f(<2 x float>)
|
declare <2 x float> @_Z4sqrtDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z4sqrtDv3_f(<3 x float>)
|
declare <3 x float> @_Z4sqrtDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-simplifylib %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare float @_Z5truncf(float)
|
declare float @_Z5truncf(float)
|
||||||
declare <2 x float> @_Z5truncDv2_f(<2 x float>)
|
declare <2 x float> @_Z5truncDv2_f(<2 x float>)
|
||||||
declare <3 x float> @_Z5truncDv3_f(<3 x float>)
|
declare <3 x float> @_Z5truncDv3_f(<3 x float>)
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --check-globals
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --check-globals
|
||||||
; RUN: opt -mtriple=amdgcn-unknown-amdhsa -S -passes=amdgpu-attributor < %s | FileCheck -check-prefix=HSA %s
|
; RUN: opt -mtriple=amdgcn-unknown-amdhsa -S -passes=amdgpu-attributor < %s | FileCheck -check-prefix=HSA %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
declare i32 @llvm.amdgcn.workgroup.id.x() #0
|
declare i32 @llvm.amdgcn.workgroup.id.x() #0
|
||||||
declare i32 @llvm.amdgcn.workgroup.id.y() #0
|
declare i32 @llvm.amdgcn.workgroup.id.y() #0
|
||||||
declare i32 @llvm.amdgcn.workgroup.id.z() #0
|
declare i32 @llvm.amdgcn.workgroup.id.z() #0
|
||||||
|
@ -1,6 +1,5 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa --amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa --amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
|
|
||||||
; OPT-LABEL: @amdgpu_noclobber_global(
|
; OPT-LABEL: @amdgpu_noclobber_global(
|
||||||
|
@ -12,7 +12,6 @@
|
|||||||
; for buffer-related memcpy() calls turns into something reasonable in
|
; for buffer-related memcpy() calls turns into something reasonable in
|
||||||
; the backend, despite the wide intermediate vectors
|
; the backend, despite the wide intermediate vectors
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
;; memcpy
|
;; memcpy
|
||||||
|
@ -7,8 +7,6 @@
|
|||||||
; RUN: llc -mtriple=amdgcn -mcpu=tonga -mattr=-flat-for-global -amdgpu-scalarize-global-loads=false -mattr=-promote-alloca < %s | FileCheck -check-prefix=GCN -check-prefix=VI -check-prefix=SICIVI %s
|
; RUN: llc -mtriple=amdgcn -mcpu=tonga -mattr=-flat-for-global -amdgpu-scalarize-global-loads=false -mattr=-promote-alloca < %s | FileCheck -check-prefix=GCN -check-prefix=VI -check-prefix=SICIVI %s
|
||||||
; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -mattr=-promote-alloca -amdgpu-scalarize-global-loads=false < %s | FileCheck -check-prefix=GCN -check-prefix=GFX9 %s
|
; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -mattr=-promote-alloca -amdgpu-scalarize-global-loads=false < %s | FileCheck -check-prefix=GCN -check-prefix=GFX9 %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; OPT-LABEL: @test_sink_global_small_offset_i32(
|
; OPT-LABEL: @test_sink_global_small_offset_i32(
|
||||||
; OPT-CI-NOT: getelementptr i32, ptr addrspace(1) %in
|
; OPT-CI-NOT: getelementptr i32, ptr addrspace(1) %in
|
||||||
; OPT-VI: getelementptr i32, ptr addrspace(1) %in
|
; OPT-VI: getelementptr i32, ptr addrspace(1) %in
|
||||||
|
@ -6,7 +6,6 @@
|
|||||||
# GCN: {{^body}}
|
# GCN: {{^body}}
|
||||||
|
|
||||||
--- |
|
--- |
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
target triple = "amdgcn--amdpal"
|
target triple = "amdgcn--amdpal"
|
||||||
|
|
||||||
define amdgpu_cs void @_amdgpu_cs_main(<3 x i32>) #0 {
|
define amdgpu_cs void @_amdgpu_cs_main(<3 x i32>) #0 {
|
||||||
|
@ -6,7 +6,6 @@
|
|||||||
# GCN: {{^body}}
|
# GCN: {{^body}}
|
||||||
|
|
||||||
--- |
|
--- |
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
target triple = "amdgcn--amdpal"
|
target triple = "amdgcn--amdpal"
|
||||||
|
|
||||||
; Function Attrs: nounwind
|
; Function Attrs: nounwind
|
||||||
|
@ -15,7 +15,6 @@
|
|||||||
#
|
#
|
||||||
|
|
||||||
--- |
|
--- |
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
target triple = "amdgcn--amdpal"
|
target triple = "amdgcn--amdpal"
|
||||||
|
|
||||||
define amdgpu_ps void @main() #0 {
|
define amdgpu_ps void @main() #0 {
|
||||||
|
@ -6,7 +6,6 @@
|
|||||||
# GCN: {{^body}}
|
# GCN: {{^body}}
|
||||||
|
|
||||||
--- |
|
--- |
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
target triple = "amdgcn--amdpal"
|
target triple = "amdgcn--amdpal"
|
||||||
|
|
||||||
; Function Attrs: nounwind
|
; Function Attrs: nounwind
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
; NOTE: There must be no spill reload inside the loop starting with LBB0_1:
|
; NOTE: There must be no spill reload inside the loop starting with LBB0_1:
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 < %s | FileCheck %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 < %s | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9-p9:192:256:256:32"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
|
||||||
|
|
||||||
define amdgpu_kernel void @foo(ptr %.sroa.1.0.copyload, ptr %0, ptr %1, ptr %2, ptr %3, ptr %4, ptr %5, ptr %6, ptr %7, ptr %8, ptr %9, ptr %10, ptr %11, ptr %12, ptr %13, ptr %14, ptr %15, ptr %16, ptr %17, ptr %18, ptr %19, ptr %20, ptr %21, ptr %22, ptr %23, ptr %24, ptr %25, ptr %26, ptr %27, ptr %28, ptr %29, ptr %30, ptr %31, ptr %32, ptr %33, double %34, double %35, double %36, float %37, float %38, float %39, float %40, ptr %41) {
|
define amdgpu_kernel void @foo(ptr %.sroa.1.0.copyload, ptr %0, ptr %1, ptr %2, ptr %3, ptr %4, ptr %5, ptr %6, ptr %7, ptr %8, ptr %9, ptr %10, ptr %11, ptr %12, ptr %13, ptr %14, ptr %15, ptr %16, ptr %17, ptr %18, ptr %19, ptr %20, ptr %21, ptr %22, ptr %23, ptr %24, ptr %25, ptr %26, ptr %27, ptr %28, ptr %29, ptr %30, ptr %31, ptr %32, ptr %33, double %34, double %35, double %36, float %37, float %38, float %39, float %40, ptr %41) {
|
||||||
; CHECK-LABEL: foo:
|
; CHECK-LABEL: foo:
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -print-after=si-annotate-control-flow %s -o /dev/null 2>&1 | FileCheck %s
|
; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -print-after=si-annotate-control-flow %s -o /dev/null 2>&1 | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "n32"
|
|
||||||
|
|
||||||
; CHECK-LABEL: @switch_unreachable_default
|
; CHECK-LABEL: @switch_unreachable_default
|
||||||
|
|
||||||
define amdgpu_kernel void @switch_unreachable_default(ptr addrspace(1) %out, ptr addrspace(1) %in0, ptr addrspace(1) %in1) #0 {
|
define amdgpu_kernel void @switch_unreachable_default(ptr addrspace(1) %out, ptr addrspace(1) %in0, ptr addrspace(1) %in1) #0 {
|
||||||
|
@ -3,7 +3,6 @@
|
|||||||
; RUN: llc -global-isel=1 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GFX9-GISEL %s
|
; RUN: llc -global-isel=1 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GFX9-GISEL %s
|
||||||
; RUN: llc -global-isel=0 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 < %s | FileCheck -check-prefix=GFX11-SDAG %s
|
; RUN: llc -global-isel=0 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 < %s | FileCheck -check-prefix=GFX11-SDAG %s
|
||||||
; RUN: llc -global-isel=1 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 < %s | FileCheck -check-prefix=GFX11-GISEL %s
|
; RUN: llc -global-isel=1 -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1100 < %s | FileCheck -check-prefix=GFX11-GISEL %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
define amdgpu_kernel void @test_dynamic_stackalloc_kernel_uniform(i32 %n) {
|
define amdgpu_kernel void @test_dynamic_stackalloc_kernel_uniform(i32 %n) {
|
||||||
; GFX9-SDAG-LABEL: test_dynamic_stackalloc_kernel_uniform:
|
; GFX9-SDAG-LABEL: test_dynamic_stackalloc_kernel_uniform:
|
||||||
|
@ -1,6 +1,5 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: -p --function-signature
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: -p --function-signature
|
||||||
; RUN: opt -S --passes=expand-variadics --expand-variadics-override=lowering < %s | FileCheck %s
|
; RUN: opt -S --passes=expand-variadics --expand-variadics-override=lowering < %s | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; Check the variables are lowered to the locations this target expects
|
; Check the variables are lowered to the locations this target expects
|
||||||
@ -540,5 +539,3 @@ entry:
|
|||||||
tail call void (...) %0(%struct.libcS %.fca.5.insert)
|
tail call void (...) %0(%struct.libcS %.fca.5.insert)
|
||||||
ret void
|
ret void
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: llc -debug-only=machine-scheduler -mtriple=amdgcn-- -verify-machineinstrs %s -o - 2>&1| FileCheck -check-prefix=DEBUG %s
|
; RUN: llc -debug-only=machine-scheduler -mtriple=amdgcn-- -verify-machineinstrs %s -o - 2>&1| FileCheck -check-prefix=DEBUG %s
|
||||||
target datalayout = "A5"
|
|
||||||
; REQUIRES: asserts
|
; REQUIRES: asserts
|
||||||
|
|
||||||
; Verify that the extload generated from %eval has the default
|
; Verify that the extload generated from %eval has the default
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; RUN: opt -passes='default<O1>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O1 %s
|
; RUN: opt -passes='default<O1>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O1 %s
|
||||||
; RUN: opt -passes='default<O2>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O2 %s
|
; RUN: opt -passes='default<O2>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O2 %s
|
||||||
; RUN: opt -passes='default<O3>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O3 %s
|
; RUN: opt -passes='default<O3>,instnamer' -mtriple=amdgcn-- -S -o - %s | FileCheck -check-prefixes=GCN,O3 %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; GCN-LABEL: t0
|
; GCN-LABEL: t0
|
||||||
; O1-NOT: alloca
|
; O1-NOT: alloca
|
||||||
|
@ -3,8 +3,6 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -amdgpu-stress-function-calls -passes=amdgpu-always-inline -amdgpu-enable-lower-module-lds=false %s | FileCheck --check-prefix=ALL %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -amdgpu-stress-function-calls -passes=amdgpu-always-inline -amdgpu-enable-lower-module-lds=false %s | FileCheck --check-prefix=ALL %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -amdgpu-stress-function-calls -passes=amdgpu-always-inline -amdgpu-enable-lower-module-lds=false %s | FileCheck --check-prefix=ALL %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -amdgpu-stress-function-calls -passes=amdgpu-always-inline -amdgpu-enable-lower-module-lds=false %s | FileCheck --check-prefix=ALL %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
@lds0 = addrspace(3) global i32 poison, align 4
|
@lds0 = addrspace(3) global i32 poison, align 4
|
||||||
@lds1 = addrspace(3) global [512 x i32] poison, align 4
|
@lds1 = addrspace(3) global [512 x i32] poison, align 4
|
||||||
@nested.lds.address = addrspace(1) global ptr addrspace(3) @lds0, align 4
|
@nested.lds.address = addrspace(1) global ptr addrspace(3) @lds0, align 4
|
||||||
|
@ -2,8 +2,6 @@
|
|||||||
; RUN: opt -passes=loop-idiom -S < %s -mtriple=amdgcn -mcpu=tahiti -verify-machineinstrs| FileCheck --check-prefix=SI --check-prefix=FUNC %s
|
; RUN: opt -passes=loop-idiom -S < %s -mtriple=amdgcn -mcpu=tahiti -verify-machineinstrs| FileCheck --check-prefix=SI --check-prefix=FUNC %s
|
||||||
; RUN: opt -passes=loop-idiom -S < %s -mtriple=amdgcn -mcpu=tonga -verify-machineinstrs| FileCheck --check-prefix=SI --check-prefix=FUNC %s
|
; RUN: opt -passes=loop-idiom -S < %s -mtriple=amdgcn -mcpu=tonga -verify-machineinstrs| FileCheck --check-prefix=SI --check-prefix=FUNC %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; Make sure loop-idiom doesn't create memcpy or memset. There are no library
|
; Make sure loop-idiom doesn't create memcpy or memset. There are no library
|
||||||
; implementations of these for R600.
|
; implementations of these for R600.
|
||||||
|
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
define ptr addrspace(7) @recur.inner.1(ptr addrspace(7) %x, i32 %v) {
|
define ptr addrspace(7) @recur.inner.1(ptr addrspace(7) %x, i32 %v) {
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
@buf = external addrspace(8) global i8
|
@buf = external addrspace(8) global i8
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
;; This should optimize to just the offset part
|
;; This should optimize to just the offset part
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
;; memcpy
|
;; memcpy
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
define void @loads(ptr addrspace(8) %buf) {
|
define void @loads(ptr addrspace(8) %buf) {
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
define void @scalar_copy(ptr %a, ptr %b) {
|
define void @scalar_copy(ptr %a, ptr %b) {
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
define ptr addrspace(7) @gep(ptr addrspace(7) %in, i32 %idx) {
|
define ptr addrspace(7) @gep(ptr addrspace(7) %in, i32 %idx) {
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers -check-debugify < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -amdgpu-lower-buffer-fat-pointers -check-debugify < %s | FileCheck %s
|
||||||
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers,check-debugify < %s | FileCheck %s
|
; RUN: opt -S -mcpu=gfx900 -passes=amdgpu-lower-buffer-fat-pointers,check-debugify < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8"
|
|
||||||
target triple = "amdgcn--"
|
target triple = "amdgcn--"
|
||||||
|
|
||||||
define float @debug_stash_pointer(ptr addrspace(8) %buf, i32 %idx, ptr addrspace(8) %aux) !dbg !5 {
|
define float @debug_stash_pointer(ptr addrspace(8) %buf, i32 %idx, ptr addrspace(8) %aux) !dbg !5 {
|
||||||
|
@ -2,8 +2,6 @@
|
|||||||
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -o - -passes=amdgpu-lower-kernel-arguments %s | FileCheck -check-prefixes=GCN,HSA %s
|
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -o - -passes=amdgpu-lower-kernel-arguments %s | FileCheck -check-prefixes=GCN,HSA %s
|
||||||
; RUN: opt -mtriple=amdgcn-- -S -o - -passes=amdgpu-lower-kernel-arguments %s | FileCheck -check-prefixes=GCN,MESA %s
|
; RUN: opt -mtriple=amdgcn-- -S -o - -passes=amdgpu-lower-kernel-arguments %s | FileCheck -check-prefixes=GCN,MESA %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
declare void @llvm.fake.use(...)
|
declare void @llvm.fake.use(...)
|
||||||
|
|
||||||
define amdgpu_kernel void @kern_noargs() {
|
define amdgpu_kernel void @kern_noargs() {
|
||||||
@ -489,7 +487,7 @@ define amdgpu_kernel void @kern_lds_ptr(ptr addrspace(3) %lds) #0 {
|
|||||||
; HSA-NEXT: ret void
|
; HSA-NEXT: ret void
|
||||||
;
|
;
|
||||||
; MESA-LABEL: @kern_lds_ptr(
|
; MESA-LABEL: @kern_lds_ptr(
|
||||||
; MESA-NEXT: [[KERN_LDS_PTR_KERNARG_SEGMENT:%.*]] = call nonnull align 16 dereferenceable(264) ptr addrspace(4) @llvm.amdgcn.kernarg.segment.ptr()
|
; MESA-NEXT: [[KERN_LDS_PTR_KERNARG_SEGMENT:%.*]] = call nonnull align 16 dereferenceable(260) ptr addrspace(4) @llvm.amdgcn.kernarg.segment.ptr()
|
||||||
; MESA-NEXT: [[LDS_KERNARG_OFFSET:%.*]] = getelementptr inbounds i8, ptr addrspace(4) [[KERN_LDS_PTR_KERNARG_SEGMENT]], i64 36
|
; MESA-NEXT: [[LDS_KERNARG_OFFSET:%.*]] = getelementptr inbounds i8, ptr addrspace(4) [[KERN_LDS_PTR_KERNARG_SEGMENT]], i64 36
|
||||||
; MESA-NEXT: [[LDS_LOAD:%.*]] = load ptr addrspace(3), ptr addrspace(4) [[LDS_KERNARG_OFFSET]], align 4, !invariant.load [[META0]]
|
; MESA-NEXT: [[LDS_LOAD:%.*]] = load ptr addrspace(3), ptr addrspace(4) [[LDS_KERNARG_OFFSET]], align 4, !invariant.load [[META0]]
|
||||||
; MESA-NEXT: store i32 0, ptr addrspace(3) [[LDS_LOAD]], align 4
|
; MESA-NEXT: store i32 0, ptr addrspace(3) [[LDS_LOAD]], align 4
|
||||||
@ -500,10 +498,15 @@ define amdgpu_kernel void @kern_lds_ptr(ptr addrspace(3) %lds) #0 {
|
|||||||
}
|
}
|
||||||
|
|
||||||
define amdgpu_kernel void @kern_lds_ptr_si(ptr addrspace(3) %lds) #2 {
|
define amdgpu_kernel void @kern_lds_ptr_si(ptr addrspace(3) %lds) #2 {
|
||||||
; GCN-LABEL: @kern_lds_ptr_si(
|
; HSA-LABEL: @kern_lds_ptr_si(
|
||||||
; GCN-NEXT: [[KERN_LDS_PTR_SI_KERNARG_SEGMENT:%.*]] = call nonnull align 16 dereferenceable(264) ptr addrspace(4) @llvm.amdgcn.kernarg.segment.ptr()
|
; HSA-NEXT: [[KERN_LDS_PTR_SI_KERNARG_SEGMENT:%.*]] = call nonnull align 16 dereferenceable(264) ptr addrspace(4) @llvm.amdgcn.kernarg.segment.ptr()
|
||||||
; GCN-NEXT: store i32 0, ptr addrspace(3) [[LDS:%.*]], align 4
|
; HSA-NEXT: store i32 0, ptr addrspace(3) [[LDS:%.*]], align 4
|
||||||
; GCN-NEXT: ret void
|
; HSA-NEXT: ret void
|
||||||
|
;
|
||||||
|
; MESA-LABEL: @kern_lds_ptr_si(
|
||||||
|
; MESA-NEXT: [[KERN_LDS_PTR_SI_KERNARG_SEGMENT:%.*]] = call nonnull align 16 dereferenceable(260) ptr addrspace(4) @llvm.amdgcn.kernarg.segment.ptr()
|
||||||
|
; MESA-NEXT: store i32 0, ptr addrspace(3) [[LDS:%.*]], align 4
|
||||||
|
; MESA-NEXT: ret void
|
||||||
;
|
;
|
||||||
store i32 0, ptr addrspace(3) %lds, align 4
|
store i32 0, ptr addrspace(3) %lds, align 4
|
||||||
ret void
|
ret void
|
||||||
|
@ -3,9 +3,6 @@
|
|||||||
|
|
||||||
; ModuleID = 'kernel_round1_passing.bc'
|
; ModuleID = 'kernel_round1_passing.bc'
|
||||||
source_filename = "/tmp/comgr-295d04/input/CompileSource"
|
source_filename = "/tmp/comgr-295d04/input/CompileSource"
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
|
||||||
|
|
||||||
@kernel_round1.first_words_data = external hidden unnamed_addr addrspace(3) global [896 x i8], align 1
|
@kernel_round1.first_words_data = external hidden unnamed_addr addrspace(3) global [896 x i8], align 1
|
||||||
@kernel_round1.collisionsData = external hidden unnamed_addr addrspace(3) global [3840 x i32], align 4
|
@kernel_round1.collisionsData = external hidden unnamed_addr addrspace(3) global [3840 x i32], align 4
|
||||||
@kernel_round1.collisionsNum = external hidden addrspace(3) global i32, align 4
|
@kernel_round1.collisionsNum = external hidden addrspace(3) global i32, align 4
|
||||||
|
@ -6,7 +6,6 @@
|
|||||||
; Confirm registers reserved in SIMachineFunctionInfo are those expected during
|
; Confirm registers reserved in SIMachineFunctionInfo are those expected during
|
||||||
; lowering, even when e.g. spilling is required due to being at OptNone.
|
; lowering, even when e.g. spilling is required due to being at OptNone.
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
target triple = "amdgcn-amd-amdpal"
|
target triple = "amdgcn-amd-amdpal"
|
||||||
|
|
||||||
define amdgpu_vs void @noop_vs() {
|
define amdgpu_vs void @noop_vs() {
|
||||||
|
@ -7,9 +7,6 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 < %s | FileCheck -check-prefixes=GFX10 %s
|
; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 < %s | FileCheck -check-prefixes=GFX10 %s
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 -global-isel < %s | FileCheck -check-prefixes=GFX10 %s
|
; RUN: llc -mtriple=amdgcn-amd-amdpal -mcpu=gfx1010 -global-isel < %s | FileCheck -check-prefixes=GFX10 %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
|
|
||||||
define amdgpu_cs void @test_simple_indirect_call() {
|
define amdgpu_cs void @test_simple_indirect_call() {
|
||||||
; ATTRIBUTOR_GCN-LABEL: define {{[^@]+}}@test_simple_indirect_call
|
; ATTRIBUTOR_GCN-LABEL: define {{[^@]+}}@test_simple_indirect_call
|
||||||
; ATTRIBUTOR_GCN-SAME: () #[[ATTR0:[0-9]+]] {
|
; ATTRIBUTOR_GCN-SAME: () #[[ATTR0:[0-9]+]] {
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; RUN: llc -mtriple=r600 -mcpu=redwood -disable-promote-alloca-to-vector < %s | FileCheck %s -check-prefix=R600 -check-prefix=FUNC
|
; RUN: llc -mtriple=r600 -mcpu=redwood -disable-promote-alloca-to-vector < %s | FileCheck %s -check-prefix=R600 -check-prefix=FUNC
|
||||||
; RUN: llc -mtriple=r600 -mcpu=redwood < %s | FileCheck %s -check-prefix=R600-VECT -check-prefix=FUNC
|
; RUN: llc -mtriple=r600 -mcpu=redwood < %s | FileCheck %s -check-prefix=R600-VECT -check-prefix=FUNC
|
||||||
; RUN: opt -S -mtriple=r600-unknown-unknown -mcpu=redwood -passes=amdgpu-promote-alloca -disable-promote-alloca-to-vector < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=r600-unknown-unknown -mcpu=redwood -passes=amdgpu-promote-alloca -disable-promote-alloca-to-vector < %s | FileCheck -check-prefix=OPT %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
declare i32 @llvm.r600.read.tidig.x() nounwind readnone
|
declare i32 @llvm.r600.read.tidig.x() nounwind readnone
|
||||||
|
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca %s | FileCheck -check-prefix=OPT %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
declare void @llvm.lifetime.start.p5(i64, ptr addrspace(5) nocapture) #0
|
declare void @llvm.lifetime.start.p5(i64, ptr addrspace(5) nocapture) #0
|
||||||
declare void @llvm.lifetime.end.p5(i64, ptr addrspace(5) nocapture) #0
|
declare void @llvm.lifetime.end.p5(i64, ptr addrspace(5) nocapture) #0
|
||||||
|
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
define amdgpu_kernel void @test_overwrite(i64 %val, i1 %cond) {
|
define amdgpu_kernel void @test_overwrite(i64 %val, i1 %cond) {
|
||||||
; CHECK-LABEL: define amdgpu_kernel void @test_overwrite
|
; CHECK-LABEL: define amdgpu_kernel void @test_overwrite
|
||||||
; CHECK-SAME: (i64 [[VAL:%.*]], i1 [[COND:%.*]]) {
|
; CHECK-SAME: (i64 [[VAL:%.*]], i1 [[COND:%.*]]) {
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca -amdgpu-promote-alloca-to-vector-limit=512 -amdgpu-promote-alloca-to-vector-max-regs=32 < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -passes=amdgpu-promote-alloca -amdgpu-promote-alloca-to-vector-limit=512 -amdgpu-promote-alloca-to-vector-max-regs=32 < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
define void @test_trivial_subvector(<2 x i64> %val.0, <2 x i64> %val.1) {
|
define void @test_trivial_subvector(<2 x i64> %val.0, <2 x i64> %val.1) {
|
||||||
; CHECK-LABEL: define void @test_trivial_subvector
|
; CHECK-LABEL: define void @test_trivial_subvector
|
||||||
; CHECK-SAME: (<2 x i64> [[VAL_0:%.*]], <2 x i64> [[VAL_1:%.*]]) {
|
; CHECK-SAME: (<2 x i64> [[VAL_0:%.*]], <2 x i64> [[VAL_1:%.*]]) {
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; RUN: opt -S -disable-promote-alloca-to-vector -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -passes=amdgpu-promote-alloca < %s | FileCheck -check-prefix=IR %s
|
; RUN: opt -S -disable-promote-alloca-to-vector -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -passes=amdgpu-promote-alloca < %s | FileCheck -check-prefix=IR %s
|
||||||
; RUN: llc -disable-promote-alloca-to-vector -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -amdgpu-enable-lower-module-lds=false < %s | FileCheck -check-prefix=ASM %s
|
; RUN: llc -disable-promote-alloca-to-vector -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -amdgpu-enable-lower-module-lds=false < %s | FileCheck -check-prefix=ASM %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
@all_lds = internal unnamed_addr addrspace(3) global [16384 x i32] poison, align 4
|
@all_lds = internal unnamed_addr addrspace(3) global [16384 x i32] poison, align 4
|
||||||
@some_lds = internal unnamed_addr addrspace(3) global [32 x i32] poison, align 4
|
@some_lds = internal unnamed_addr addrspace(3) global [32 x i32] poison, align 4
|
||||||
@some_dynamic_lds = external hidden addrspace(3) global [0 x i32], align 4
|
@some_dynamic_lds = external hidden addrspace(3) global [0 x i32], align 4
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -passes=amdgpu-promote-alloca < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; CHECK-LABEL: @lds_promoted_alloca_select_invalid_pointer_operand(
|
; CHECK-LABEL: @lds_promoted_alloca_select_invalid_pointer_operand(
|
||||||
; CHECK: %alloca = alloca i32
|
; CHECK: %alloca = alloca i32
|
||||||
; CHECK: select i1 undef, ptr addrspace(5) poison, ptr addrspace(5) %alloca
|
; CHECK: select i1 undef, ptr addrspace(5) poison, ptr addrspace(5) %alloca
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=amdgpu-lower-kernel-attributes,instcombine,infer-alignment %s | FileCheck -enable-var-scope %s
|
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=amdgpu-lower-kernel-attributes,instcombine,infer-alignment %s | FileCheck -enable-var-scope %s
|
||||||
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=amdgpu-lower-kernel-attributes,instcombine,infer-alignment %s | FileCheck -enable-var-scope %s
|
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=amdgpu-lower-kernel-attributes,instcombine,infer-alignment %s | FileCheck -enable-var-scope %s
|
||||||
|
|
||||||
target datalayout = "n32"
|
|
||||||
|
|
||||||
; CHECK-LABEL: @invalid_reqd_work_group_size(
|
; CHECK-LABEL: @invalid_reqd_work_group_size(
|
||||||
; CHECK: load i16,
|
; CHECK: load i16,
|
||||||
define amdgpu_kernel void @invalid_reqd_work_group_size(ptr addrspace(1) %out) #0 !reqd_work_group_size !1 {
|
define amdgpu_kernel void @invalid_reqd_work_group_size(ptr addrspace(1) %out) #0 !reqd_work_group_size !1 {
|
||||||
|
@ -24,7 +24,6 @@
|
|||||||
--- |
|
--- |
|
||||||
; ModuleID = 'sdwa-scalar-ops.opt.ll'
|
; ModuleID = 'sdwa-scalar-ops.opt.ll'
|
||||||
source_filename = "sdwa-scalar-ops.opt.ll"
|
source_filename = "sdwa-scalar-ops.opt.ll"
|
||||||
target datalayout = "e-p:32:32-p1:64:64-p2:64:64-p3:32:32-p4:64:64-p5:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64"
|
|
||||||
|
|
||||||
define amdgpu_kernel void @sdwa_imm_operand(ptr addrspace(1) nocapture %arg) {
|
define amdgpu_kernel void @sdwa_imm_operand(ptr addrspace(1) nocapture %arg) {
|
||||||
bb:
|
bb:
|
||||||
|
@ -1,8 +1,5 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx906 -verify-machineinstrs -o - %s | FileCheck %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx906 -verify-machineinstrs -o - %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-ni:7:8"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
|
||||||
|
|
||||||
; CHECK-LABEL: {{^}}t0:
|
; CHECK-LABEL: {{^}}t0:
|
||||||
; CHECK: s_load_dwordx2 s[[[PTR_LO:[0-9]+]]:[[PTR_HI:[0-9]+]]], s[8:9], 0x0
|
; CHECK: s_load_dwordx2 s[[[PTR_LO:[0-9]+]]:[[PTR_HI:[0-9]+]]], s[8:9], 0x0
|
||||||
; CHECK: v_mov_b32_e32 v{{[0-9]+}}, s[[PTR_HI]]
|
; CHECK: v_mov_b32_e32 v{{[0-9]+}}, s[[PTR_HI]]
|
||||||
|
@ -2,7 +2,6 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=fiji -mattr=-flat-for-global -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,FIJI %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=fiji -mattr=-flat-for-global -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,FIJI %s
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=hawaii -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,HAWAII %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=hawaii -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,HAWAII %s
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -mattr=-flat-for-global -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,GFX9 %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -mattr=-flat-for-global -enable-ipra=0 -verify-machineinstrs < %s | FileCheck -enable-var-scope -check-prefixes=GCN,GFX9 %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; FIXME: Why is this commuted only sometimes?
|
; FIXME: Why is this commuted only sometimes?
|
||||||
define fastcc i32 @i32_fastcc_i32_i32(i32 %arg0, i32 %arg1) #1 {
|
define fastcc i32 @i32_fastcc_i32_i32(i32 %arg0, i32 %arg1) #1 {
|
||||||
|
@ -3,8 +3,6 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' %s | FileCheck --check-prefixes=CHECK,CW %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' %s | FileCheck --check-prefixes=CHECK,CW %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' -amdgpu-indirect-call-specialization-threshold=0 %s | FileCheck --check-prefixes=CHECK,NO %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' -amdgpu-indirect-call-specialization-threshold=0 %s | FileCheck --check-prefixes=CHECK,NO %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
@G = global i32 0, align 4
|
@G = global i32 0, align 4
|
||||||
|
|
||||||
;.
|
;.
|
||||||
|
@ -3,8 +3,6 @@
|
|||||||
|
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GFX9 %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GFX9 %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
define internal void @indirect() {
|
define internal void @indirect() {
|
||||||
; ATTRIBUTOR_GCN-LABEL: define {{[^@]+}}@indirect
|
; ATTRIBUTOR_GCN-LABEL: define {{[^@]+}}@indirect
|
||||||
; ATTRIBUTOR_GCN-SAME: () #[[ATTR0:[0-9]+]] {
|
; ATTRIBUTOR_GCN-SAME: () #[[ATTR0:[0-9]+]] {
|
||||||
|
@ -3,8 +3,6 @@
|
|||||||
; RUN: opt -mtriple=amdgcn-- -O1 -S -disable-promote-alloca-to-vector < %s | FileCheck %s --check-prefixes=FUNC,FULL-UNROLL
|
; RUN: opt -mtriple=amdgcn-- -O1 -S -disable-promote-alloca-to-vector < %s | FileCheck %s --check-prefixes=FUNC,FULL-UNROLL
|
||||||
; RUN: opt -mtriple=amdgcn-- -passes='default<O1>' -S -disable-promote-alloca-to-vector < %s | FileCheck %s --check-prefixes=FUNC,FULL-UNROLL
|
; RUN: opt -mtriple=amdgcn-- -passes='default<O1>' -S -disable-promote-alloca-to-vector < %s | FileCheck %s --check-prefixes=FUNC,FULL-UNROLL
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; This test contains a simple loop that initializes an array declared in
|
; This test contains a simple loop that initializes an array declared in
|
||||||
; private memory. This loop would be fully unrolled if we could not SROA
|
; private memory. This loop would be fully unrolled if we could not SROA
|
||||||
; the alloca. Check that we successfully eliminate it before the unroll,
|
; the alloca. Check that we successfully eliminate it before the unroll,
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt -S --amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S --amdgpu-annotate-uniform < %s | FileCheck -check-prefix=OPT %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; "load vaddr" depends on the store, so we should not mark vaddr as amdgpu.noclobber.
|
; "load vaddr" depends on the store, so we should not mark vaddr as amdgpu.noclobber.
|
||||||
|
|
||||||
|
@ -6,8 +6,6 @@
|
|||||||
; because all functions involving convergence tokens will fail the
|
; because all functions involving convergence tokens will fail the
|
||||||
; machine verifier after register allocation.
|
; machine verifier after register allocation.
|
||||||
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
|
||||||
|
|
||||||
define void @tail_call_uniform_vgpr_value_convergence_tokens() #0 {
|
define void @tail_call_uniform_vgpr_value_convergence_tokens() #0 {
|
||||||
; CHECK-LABEL: name: tail_call_uniform_vgpr_value_convergence_tokens
|
; CHECK-LABEL: name: tail_call_uniform_vgpr_value_convergence_tokens
|
||||||
; CHECK: bb.0 (%ir-block.0):
|
; CHECK: bb.0 (%ir-block.0):
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
||||||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck %s
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck %s
|
||||||
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
|
||||||
|
|
||||||
; The tail call target is known uniform, but will be in a VGPR, so we
|
; The tail call target is known uniform, but will be in a VGPR, so we
|
||||||
; need readfirstlane to legalize it.
|
; need readfirstlane to legalize it.
|
||||||
define void @tail_call_uniform_vgpr_value() {
|
define void @tail_call_uniform_vgpr_value() {
|
||||||
|
@ -1,6 +1,5 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-- -mcpu=unknown -verify-machineinstrs < %s 2>&1 | FileCheck -check-prefix=ERROR -check-prefix=GCN %s
|
; RUN: llc -mtriple=amdgcn-- -mcpu=unknown -verify-machineinstrs < %s 2>&1 | FileCheck -check-prefix=ERROR -check-prefix=GCN %s
|
||||||
; RUN: llc -mtriple=r600-- -mcpu=unknown -verify-machineinstrs < %s 2>&1 | FileCheck -check-prefix=ERROR -check-prefix=R600 %s
|
; RUN: llc -mtriple=r600-- -mcpu=unknown -verify-machineinstrs < %s 2>&1 | FileCheck -check-prefix=ERROR -check-prefix=R600 %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; Should not crash when the processor is not recognized and the
|
; Should not crash when the processor is not recognized and the
|
||||||
; wavefront size feature not set.
|
; wavefront size feature not set.
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; RUN: opt -mtriple=amdgcn-- -passes='loop-unroll,simplifycfg,sroa' %s -S -o - | FileCheck %s
|
; RUN: opt -mtriple=amdgcn-- -passes='loop-unroll,simplifycfg,sroa' %s -S -o - | FileCheck %s
|
||||||
; RUN: opt -mtriple=r600-- -passes='loop-unroll,simplifycfg,sroa' %s -S -o - | FileCheck %s
|
; RUN: opt -mtriple=r600-- -passes='loop-unroll,simplifycfg,sroa' %s -S -o - | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; This test contains a simple loop that initializes an array declared in
|
; This test contains a simple loop that initializes an array declared in
|
||||||
; private memory. We want to make sure these kinds of loops are always
|
; private memory. We want to make sure these kinds of loops are always
|
||||||
; unrolled, because private memory is slow.
|
; unrolled, because private memory is slow.
|
||||||
|
@ -3,8 +3,6 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-- -mcpu=tonga -mattr=+promote-alloca -verify-machineinstrs < %t.sroa.ll | FileCheck -enable-var-scope --check-prefixes=GCN,GCN-PROMOTE %s
|
; RUN: llc -mtriple=amdgcn-- -mcpu=tonga -mattr=+promote-alloca -verify-machineinstrs < %t.sroa.ll | FileCheck -enable-var-scope --check-prefixes=GCN,GCN-PROMOTE %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes='sroa,amdgpu-promote-alloca,instcombine' < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes='sroa,amdgpu-promote-alloca,instcombine' < %s | FileCheck -check-prefix=OPT %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; OPT-LABEL: @vector_read_alloca_bitcast(
|
; OPT-LABEL: @vector_read_alloca_bitcast(
|
||||||
; OPT-NOT: alloca
|
; OPT-NOT: alloca
|
||||||
; OPT: %0 = extractelement <4 x i32> <i32 0, i32 1, i32 2, i32 3>, i32 %index
|
; OPT: %0 = extractelement <4 x i32> <i32 0, i32 1, i32 2, i32 3>, i32 %index
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' -amdgpu-promote-alloca-to-vector-max-regs=64 < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' -amdgpu-promote-alloca-to-vector-max-regs=64 < %s | FileCheck -check-prefix=OPT %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' -amdgpu-promote-alloca-to-vector-limit=32 -amdgpu-promote-alloca-to-vector-max-regs=64 < %s | FileCheck -check-prefix=LIMIT32 %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' -amdgpu-promote-alloca-to-vector-limit=32 -amdgpu-promote-alloca-to-vector-max-regs=64 < %s | FileCheck -check-prefix=LIMIT32 %s
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; OPT-LABEL: @alloca_8xi64_max1024(
|
; OPT-LABEL: @alloca_8xi64_max1024(
|
||||||
; OPT-NOT: alloca
|
; OPT-NOT: alloca
|
||||||
; OPT: <8 x i64>
|
; OPT: <8 x i64>
|
||||||
|
@ -4,7 +4,6 @@
|
|||||||
; RUN: llc -mtriple=amdgcn-- -mcpu=tonga -mattr=+promote-alloca -verify-machineinstrs < %s | FileCheck -check-prefix=FUNC %s
|
; RUN: llc -mtriple=amdgcn-- -mcpu=tonga -mattr=+promote-alloca -verify-machineinstrs < %s | FileCheck -check-prefix=FUNC %s
|
||||||
; RUN: llc -mtriple=r600-- -mcpu=redwood < %s | FileCheck --check-prefixes=EG,FUNC %s
|
; RUN: llc -mtriple=r600-- -mcpu=redwood < %s | FileCheck --check-prefixes=EG,FUNC %s
|
||||||
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' < %s | FileCheck -check-prefix=OPT %s
|
; RUN: opt -S -mtriple=amdgcn-- -passes='amdgpu-promote-alloca,sroa,instcombine' < %s | FileCheck -check-prefix=OPT %s
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; OPT-LABEL: @vector_read(
|
; OPT-LABEL: @vector_read(
|
||||||
; OPT: %0 = extractelement <4 x i32> <i32 0, i32 1, i32 2, i32 3>, i32 %index
|
; OPT: %0 = extractelement <4 x i32> <i32 0, i32 1, i32 2, i32 3>, i32 %index
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; Here we check that the global redzone sizes grow with the object size
|
; Here we check that the global redzone sizes grow with the object size
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; Here we check that the global redzone sizes grow with the object size
|
; Here we check that the global redzone sizes grow with the object size
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; Memory access to lds are not instrumented
|
; Memory access to lds are not instrumented
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
; Memory access to scratch are not instrumented
|
; Memory access to scratch are not instrumented
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
@x = addrspace(4) global [2 x i32] zeroinitializer, align 4
|
@x = addrspace(4) global [2 x i32] zeroinitializer, align 4
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
define protected amdgpu_kernel void @generic_store(ptr addrspace(1) %p, i32 %i) sanitize_address {
|
define protected amdgpu_kernel void @generic_store(ptr addrspace(1) %p, i32 %i) sanitize_address {
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 3
|
||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
; RUN: opt < %s -passes=asan -asan-recover -S | FileCheck %s --check-prefix=RECOV
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
define protected amdgpu_kernel void @global_store(ptr addrspace(1) %p, i32 %i) sanitize_address {
|
define protected amdgpu_kernel void @global_store(ptr addrspace(1) %p, i32 %i) sanitize_address {
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
;RUN: opt < %s -mtriple=amdgcn-amd-amdhsa -passes=asan -S | FileCheck %s
|
;RUN: opt < %s -mtriple=amdgcn-amd-amdhsa -passes=asan -S | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
|
|
||||||
declare void @llvm.memcpy.p0.p0.i64(ptr noalias nocapture writeonly, ptr noalias nocapture readonly, i64, i1 immarg)
|
declare void @llvm.memcpy.p0.p0.i64(ptr noalias nocapture writeonly, ptr noalias nocapture readonly, i64, i1 immarg)
|
||||||
declare void @llvm.memcpy.p0.p1.i64(ptr noalias nocapture writeonly, ptr addrspace(1) noalias nocapture readonly, i64, i1 immarg)
|
declare void @llvm.memcpy.p0.p1.i64(ptr noalias nocapture writeonly, ptr addrspace(1) noalias nocapture readonly, i64, i1 immarg)
|
||||||
declare void @llvm.memcpy.p0.p2.i64(ptr noalias nocapture writeonly, ptr addrspace(2) noalias nocapture readonly, i64, i1 immarg)
|
declare void @llvm.memcpy.p0.p2.i64(ptr noalias nocapture writeonly, ptr addrspace(2) noalias nocapture readonly, i64, i1 immarg)
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
@g = addrspace(1) global [1 x i32] zeroinitializer, align 4
|
@g = addrspace(1) global [1 x i32] zeroinitializer, align 4
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
@G10 = addrspace(3) global [10 x i8] zeroinitializer, align 1
|
@G10 = addrspace(3) global [10 x i8] zeroinitializer, align 1
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
; RUN: opt < %s -passes=asan -S | FileCheck %s
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn-amd-amdhsa"
|
target triple = "amdgcn-amd-amdhsa"
|
||||||
|
|
||||||
@G10 = addrspace(5) global [10 x i8] zeroinitializer, align 1
|
@G10 = addrspace(5) global [10 x i8] zeroinitializer, align 1
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
||||||
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=atomic-expand %s | FileCheck %s
|
; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes=atomic-expand %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
define i16 @test_atomicrmw_xchg_i16_global_system(ptr addrspace(1) %ptr, i16 %value) {
|
define i16 @test_atomicrmw_xchg_i16_global_system(ptr addrspace(1) %ptr, i16 %value) {
|
||||||
; CHECK-LABEL: @test_atomicrmw_xchg_i16_global_system(
|
; CHECK-LABEL: @test_atomicrmw_xchg_i16_global_system(
|
||||||
; CHECK-NEXT: [[ALIGNEDADDR:%.*]] = call ptr addrspace(1) @llvm.ptrmask.p1.i64(ptr addrspace(1) [[PTR:%.*]], i64 -4)
|
; CHECK-NEXT: [[ALIGNEDADDR:%.*]] = call ptr addrspace(1) @llvm.ptrmask.p1.i64(ptr addrspace(1) [[PTR:%.*]], i64 -4)
|
||||||
|
@ -1,7 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
||||||
; RUN: opt -passes=indvars -S < %s | FileCheck %s
|
; RUN: opt -passes=indvars -S < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
|
|
||||||
target triple = "amdgcn--amdpal"
|
target triple = "amdgcn--amdpal"
|
||||||
|
|
||||||
define void @f(ptr addrspace(7) %arg) {
|
define void @f(ptr addrspace(7) %arg) {
|
||||||
|
@ -9,8 +9,6 @@
|
|||||||
; twice as expensive as that on a 32-bit integer, or split into 2
|
; twice as expensive as that on a 32-bit integer, or split into 2
|
||||||
; 32-bit components.
|
; 32-bit components.
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; CHECK-LABEL: @indvar_32_bit(
|
; CHECK-LABEL: @indvar_32_bit(
|
||||||
; CHECK-NOT: sext i32
|
; CHECK-NOT: sext i32
|
||||||
; CHECK: phi i32
|
; CHECK: phi i32
|
||||||
|
@ -1,8 +1,6 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
||||||
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=infer-address-spaces,instsimplify %s | FileCheck %s
|
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=infer-address-spaces,instsimplify %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
define i8 @ptrmask_cast_local_to_flat(ptr addrspace(3) %src.ptr, i64 %mask) {
|
define i8 @ptrmask_cast_local_to_flat(ptr addrspace(3) %src.ptr, i64 %mask) {
|
||||||
; CHECK-LABEL: @ptrmask_cast_local_to_flat(
|
; CHECK-LABEL: @ptrmask_cast_local_to_flat(
|
||||||
; CHECK-NEXT: [[CAST:%.*]] = addrspacecast ptr addrspace(3) [[SRC_PTR:%.*]] to ptr
|
; CHECK-NEXT: [[CAST:%.*]] = addrspacecast ptr addrspace(3) [[SRC_PTR:%.*]] to ptr
|
||||||
|
@ -2,8 +2,6 @@
|
|||||||
|
|
||||||
; REQUIRES: asserts
|
; REQUIRES: asserts
|
||||||
|
|
||||||
target datalayout = "A5"
|
|
||||||
|
|
||||||
; Verify we are properly adding cost of the -amdgpu-inline-arg-alloca-cost to the threshold.
|
; Verify we are properly adding cost of the -amdgpu-inline-arg-alloca-cost to the threshold.
|
||||||
|
|
||||||
define void @local_access_only(ptr addrspace(5) %p, i32 %idx) {
|
define void @local_access_only(ptr addrspace(5) %p, i32 %idx) {
|
||||||
|
@ -1,7 +1,5 @@
|
|||||||
; RUN: opt -mtriple=amdgcn--amdhsa -S -passes=inline -inline-threshold=0 < %s | FileCheck %s
|
; RUN: opt -mtriple=amdgcn--amdhsa -S -passes=inline -inline-threshold=0 < %s | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
define void @use_flat_ptr_arg(ptr nocapture %p) {
|
define void @use_flat_ptr_arg(ptr nocapture %p) {
|
||||||
entry:
|
entry:
|
||||||
%tmp1 = load float, ptr %p, align 4
|
%tmp1 = load float, ptr %p, align 4
|
||||||
|
@ -4,8 +4,6 @@
|
|||||||
; Make sure the optimization from memcpy-from-global.ll happens, but
|
; Make sure the optimization from memcpy-from-global.ll happens, but
|
||||||
; the constant source is not a global variable.
|
; the constant source is not a global variable.
|
||||||
|
|
||||||
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
|
|
||||||
|
|
||||||
; Simple memcpy to alloca from constant address space argument.
|
; Simple memcpy to alloca from constant address space argument.
|
||||||
define i8 @memcpy_constant_arg_ptr_to_alloca(ptr addrspace(4) noalias readonly align 4 dereferenceable(32) %arg, i32 %idx) {
|
define i8 @memcpy_constant_arg_ptr_to_alloca(ptr addrspace(4) noalias readonly align 4 dereferenceable(32) %arg, i32 %idx) {
|
||||||
; CHECK-LABEL: @memcpy_constant_arg_ptr_to_alloca(
|
; CHECK-LABEL: @memcpy_constant_arg_ptr_to_alloca(
|
||||||
|
Some files were not shown because too many files have changed in this diff Show More
Loading…
x
Reference in New Issue
Block a user