AMDGPU: Add new VA inline asm constraint for AV registers (#152665)
Add a new constraint corresponding to the AV_* register classes for operands which can allocate AGPRs or VGPRs. This applies to load and stores on gfx90a+, and srcA / srcB for MFMA instructions. The error emitted on unsupported targets isn't ideal, it is produced by the register allocator without a rationale, but it is consistent with the existing errors. I mostly want this for writing allocation tests.
This commit is contained in:
parent
a9c5d33bb4
commit
ff53086924
@ -5582,9 +5582,13 @@ AArch64:
|
||||
AMDGPU:
|
||||
|
||||
- ``r``: A 32 or 64-bit integer register.
|
||||
- ``[0-9]v``: The 32-bit VGPR register, number 0-9.
|
||||
- ``[0-9]s``: The 32-bit SGPR register, number 0-9.
|
||||
- ``[0-9]a``: The 32-bit AGPR register, number 0-9.
|
||||
- ``s``: SGPR register or tuple
|
||||
- ``v``: VGPR register or tuple
|
||||
- ``a``: AGPR register or tuple. Only valid on gfx908+.
|
||||
- ``VA``: VGPR or AGPR register or tuple. Only valid on gfx90a+.
|
||||
- ``v[0-9]``: The 32-bit VGPR register, number 0-9.
|
||||
- ``s[0-9]``: The 32-bit SGPR register, number 0-9.
|
||||
- ``a[0-9]``: The 32-bit AGPR register, number 0-9.
|
||||
- ``I``: An integer inline constant in the range from -16 to 64.
|
||||
- ``J``: A 16-bit signed integer constant.
|
||||
- ``A``: An integer or a floating-point inline constant.
|
||||
|
@ -16906,13 +16906,26 @@ SITargetLowering::getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI_,
|
||||
}
|
||||
break;
|
||||
}
|
||||
// We actually support i128, i16 and f16 as inline parameters
|
||||
// even if they are not reported as legal
|
||||
if (RC && (isTypeLegal(VT) || VT.SimpleTy == MVT::i128 ||
|
||||
VT.SimpleTy == MVT::i16 || VT.SimpleTy == MVT::f16))
|
||||
return std::pair(0U, RC);
|
||||
} else if (Constraint == "VA" && Subtarget->hasGFX90AInsts()) {
|
||||
const unsigned BitWidth = VT.getSizeInBits();
|
||||
switch (BitWidth) {
|
||||
case 16:
|
||||
RC = &AMDGPU::AV_32RegClass;
|
||||
break;
|
||||
default:
|
||||
RC = TRI->getVectorSuperClassForBitWidth(BitWidth);
|
||||
if (!RC)
|
||||
return std::pair(0U, nullptr);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
// We actually support i128, i16 and f16 as inline parameters
|
||||
// even if they are not reported as legal
|
||||
if (RC && (isTypeLegal(VT) || VT.SimpleTy == MVT::i128 ||
|
||||
VT.SimpleTy == MVT::i16 || VT.SimpleTy == MVT::f16))
|
||||
return std::pair(0U, RC);
|
||||
|
||||
auto [Kind, Idx, NumRegs] = AMDGPU::parseAsmConstraintPhysReg(Constraint);
|
||||
if (Kind != '\0') {
|
||||
if (Kind == 'v') {
|
||||
@ -16997,6 +17010,9 @@ SITargetLowering::getConstraintType(StringRef Constraint) const {
|
||||
case 'a':
|
||||
return C_RegisterClass;
|
||||
}
|
||||
} else if (Constraint.size() == 2) {
|
||||
if (Constraint == "VA")
|
||||
return C_RegisterClass;
|
||||
}
|
||||
if (isImmConstraint(Constraint)) {
|
||||
return C_Other;
|
||||
|
27
llvm/test/CodeGen/AMDGPU/inline-asm-av-constraint-err.ll
Normal file
27
llvm/test/CodeGen/AMDGPU/inline-asm-av-constraint-err.ll
Normal file
@ -0,0 +1,27 @@
|
||||
; RUN: not llc -mtriple=amdgcn -mcpu=gfx90a -filetype=null %s 2>&1 | FileCheck %s
|
||||
|
||||
; Make sure illegal type uses are correctly diagnosed
|
||||
|
||||
; CHECK: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_i8(i8 %x) {
|
||||
call void asm sideeffect "; use $0", "^VA"(i8 %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK: error: couldn't allocate output register for constraint 'VA'
|
||||
define i8 @def_A_i8() {
|
||||
%ret = call i8 asm sideeffect "; def $0", "=^VA"()
|
||||
ret i8 %ret
|
||||
}
|
||||
|
||||
; CHECK: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_i1(i1 %x) {
|
||||
call void asm sideeffect "; use $0", "^VA"(i1 %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK: error: couldn't allocate output register for constraint 'VA'
|
||||
define i1 @def_A_i1() {
|
||||
%ret = call i1 asm sideeffect "; def $0", "=^VA"()
|
||||
ret i1 %ret
|
||||
}
|
217
llvm/test/CodeGen/AMDGPU/inline-asm-av-constraint.ll
Normal file
217
llvm/test/CodeGen/AMDGPU/inline-asm-av-constraint.ll
Normal file
@ -0,0 +1,217 @@
|
||||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
||||
; RUN: not llc -mtriple=amdgcn -mcpu=gfx908 -filetype=null %s 2>&1 | FileCheck -check-prefix=ERR %s
|
||||
; RUN: llc -mtriple=amdgcn -mcpu=gfx90a < %s | FileCheck %s
|
||||
|
||||
; FIXME: Shouldn't emit and
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_i16(i16 %x) {
|
||||
; CHECK-LABEL: use_A_i16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: v_and_b32_e32 v0, 0xffff, v0
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(i16 %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_f16(half %x) {
|
||||
; CHECK-LABEL: use_A_f16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(half %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_bf16(bfloat %x) {
|
||||
; CHECK-LABEL: use_A_bf16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(bfloat %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_v2i16(<2 x i16> %x) {
|
||||
; CHECK-LABEL: use_A_v2i16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(<2 x i16> %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_v2f16(<2 x half> %x) {
|
||||
; CHECK-LABEL: use_A_v2f16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(<2 x half> %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_v2bf16(<2 x bfloat> %x) {
|
||||
; CHECK-LABEL: use_A_v2bf16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(<2 x bfloat> %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_i32(i32 %x) {
|
||||
; CHECK-LABEL: use_A_i32:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(i32 %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_f32(float %x) {
|
||||
; CHECK-LABEL: use_A_f32:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(float %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_i64(i64 %x) {
|
||||
; CHECK-LABEL: use_A_i64:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v[0:1]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(i64 %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_f64(double %x) {
|
||||
; CHECK-LABEL: use_A_f64:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v[0:1]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(double %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_p1(ptr addrspace(1) %x) {
|
||||
; CHECK-LABEL: use_A_p1:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v[0:1]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(ptr addrspace(1) %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_v32i32(<32 x i32> %x) {
|
||||
; CHECK-LABEL: use_A_v32i32:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: buffer_load_dword v31, off, s[0:3], s32
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v[0:31]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(<32 x i32> %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate input reg for constraint 'VA'
|
||||
define void @use_A_v32f32(<32 x float> %x) {
|
||||
; CHECK-LABEL: use_A_v32f32:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: buffer_load_dword v31, off, s[0:3], s32
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; use v[0:31]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
call void asm sideeffect "; use $0", "^VA"(<32 x float> %x)
|
||||
ret void
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate output register for constraint 'VA'
|
||||
define i16 @def_A_i16() {
|
||||
; CHECK-LABEL: def_A_i16:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; def v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
%ret = call i16 asm sideeffect "; def $0", "=^VA"()
|
||||
ret i16 %ret
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate output register for constraint 'VA'
|
||||
define i32 @def_A_i32() {
|
||||
; CHECK-LABEL: def_A_i32:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; def v0
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
%ret = call i32 asm sideeffect "; def $0", "=^VA"()
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
; ERR: error: couldn't allocate output register for constraint 'VA'
|
||||
define ptr addrspace(1) @def_A_p1() {
|
||||
; CHECK-LABEL: def_A_p1:
|
||||
; CHECK: ; %bb.0:
|
||||
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; CHECK-NEXT: ;;#ASMSTART
|
||||
; CHECK-NEXT: ; def v[0:1]
|
||||
; CHECK-NEXT: ;;#ASMEND
|
||||
; CHECK-NEXT: s_setpc_b64 s[30:31]
|
||||
%ret = call ptr addrspace(1) asm sideeffect "; def $0", "=^VA"()
|
||||
ret ptr addrspace(1) %ret
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user