AMDGPU: Add new VA inline asm constraint for AV registers (#152665)

Add a new constraint corresponding to the AV_* register classes
for operands which can allocate AGPRs or VGPRs. This applies
to load and stores on gfx90a+, and srcA / srcB for MFMA instructions.

The error emitted on unsupported targets isn't ideal, it is
produced by the register allocator without a rationale, but it is
consistent with the existing errors.

I mostly want this for writing allocation tests.
This commit is contained in:
Matt Arsenault 2025-08-12 10:17:28 +09:00 committed by GitHub
parent a9c5d33bb4
commit ff53086924
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
4 changed files with 272 additions and 8 deletions

View File

@ -5582,9 +5582,13 @@ AArch64:
AMDGPU:
- ``r``: A 32 or 64-bit integer register.
- ``[0-9]v``: The 32-bit VGPR register, number 0-9.
- ``[0-9]s``: The 32-bit SGPR register, number 0-9.
- ``[0-9]a``: The 32-bit AGPR register, number 0-9.
- ``s``: SGPR register or tuple
- ``v``: VGPR register or tuple
- ``a``: AGPR register or tuple. Only valid on gfx908+.
- ``VA``: VGPR or AGPR register or tuple. Only valid on gfx90a+.
- ``v[0-9]``: The 32-bit VGPR register, number 0-9.
- ``s[0-9]``: The 32-bit SGPR register, number 0-9.
- ``a[0-9]``: The 32-bit AGPR register, number 0-9.
- ``I``: An integer inline constant in the range from -16 to 64.
- ``J``: A 16-bit signed integer constant.
- ``A``: An integer or a floating-point inline constant.

View File

@ -16906,13 +16906,26 @@ SITargetLowering::getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI_,
}
break;
}
// We actually support i128, i16 and f16 as inline parameters
// even if they are not reported as legal
if (RC && (isTypeLegal(VT) || VT.SimpleTy == MVT::i128 ||
VT.SimpleTy == MVT::i16 || VT.SimpleTy == MVT::f16))
return std::pair(0U, RC);
} else if (Constraint == "VA" && Subtarget->hasGFX90AInsts()) {
const unsigned BitWidth = VT.getSizeInBits();
switch (BitWidth) {
case 16:
RC = &AMDGPU::AV_32RegClass;
break;
default:
RC = TRI->getVectorSuperClassForBitWidth(BitWidth);
if (!RC)
return std::pair(0U, nullptr);
break;
}
}
// We actually support i128, i16 and f16 as inline parameters
// even if they are not reported as legal
if (RC && (isTypeLegal(VT) || VT.SimpleTy == MVT::i128 ||
VT.SimpleTy == MVT::i16 || VT.SimpleTy == MVT::f16))
return std::pair(0U, RC);
auto [Kind, Idx, NumRegs] = AMDGPU::parseAsmConstraintPhysReg(Constraint);
if (Kind != '\0') {
if (Kind == 'v') {
@ -16997,6 +17010,9 @@ SITargetLowering::getConstraintType(StringRef Constraint) const {
case 'a':
return C_RegisterClass;
}
} else if (Constraint.size() == 2) {
if (Constraint == "VA")
return C_RegisterClass;
}
if (isImmConstraint(Constraint)) {
return C_Other;

View File

@ -0,0 +1,27 @@
; RUN: not llc -mtriple=amdgcn -mcpu=gfx90a -filetype=null %s 2>&1 | FileCheck %s
; Make sure illegal type uses are correctly diagnosed
; CHECK: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_i8(i8 %x) {
call void asm sideeffect "; use $0", "^VA"(i8 %x)
ret void
}
; CHECK: error: couldn't allocate output register for constraint 'VA'
define i8 @def_A_i8() {
%ret = call i8 asm sideeffect "; def $0", "=^VA"()
ret i8 %ret
}
; CHECK: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_i1(i1 %x) {
call void asm sideeffect "; use $0", "^VA"(i1 %x)
ret void
}
; CHECK: error: couldn't allocate output register for constraint 'VA'
define i1 @def_A_i1() {
%ret = call i1 asm sideeffect "; def $0", "=^VA"()
ret i1 %ret
}

View File

@ -0,0 +1,217 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: not llc -mtriple=amdgcn -mcpu=gfx908 -filetype=null %s 2>&1 | FileCheck -check-prefix=ERR %s
; RUN: llc -mtriple=amdgcn -mcpu=gfx90a < %s | FileCheck %s
; FIXME: Shouldn't emit and
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_i16(i16 %x) {
; CHECK-LABEL: use_A_i16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: v_and_b32_e32 v0, 0xffff, v0
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(i16 %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_f16(half %x) {
; CHECK-LABEL: use_A_f16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(half %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_bf16(bfloat %x) {
; CHECK-LABEL: use_A_bf16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(bfloat %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_v2i16(<2 x i16> %x) {
; CHECK-LABEL: use_A_v2i16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(<2 x i16> %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_v2f16(<2 x half> %x) {
; CHECK-LABEL: use_A_v2f16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(<2 x half> %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_v2bf16(<2 x bfloat> %x) {
; CHECK-LABEL: use_A_v2bf16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(<2 x bfloat> %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_i32(i32 %x) {
; CHECK-LABEL: use_A_i32:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(i32 %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_f32(float %x) {
; CHECK-LABEL: use_A_f32:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(float %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_i64(i64 %x) {
; CHECK-LABEL: use_A_i64:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v[0:1]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(i64 %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_f64(double %x) {
; CHECK-LABEL: use_A_f64:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v[0:1]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(double %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_p1(ptr addrspace(1) %x) {
; CHECK-LABEL: use_A_p1:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v[0:1]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(ptr addrspace(1) %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_v32i32(<32 x i32> %x) {
; CHECK-LABEL: use_A_v32i32:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: buffer_load_dword v31, off, s[0:3], s32
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v[0:31]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(<32 x i32> %x)
ret void
}
; ERR: error: couldn't allocate input reg for constraint 'VA'
define void @use_A_v32f32(<32 x float> %x) {
; CHECK-LABEL: use_A_v32f32:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: buffer_load_dword v31, off, s[0:3], s32
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; use v[0:31]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
call void asm sideeffect "; use $0", "^VA"(<32 x float> %x)
ret void
}
; ERR: error: couldn't allocate output register for constraint 'VA'
define i16 @def_A_i16() {
; CHECK-LABEL: def_A_i16:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; def v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
%ret = call i16 asm sideeffect "; def $0", "=^VA"()
ret i16 %ret
}
; ERR: error: couldn't allocate output register for constraint 'VA'
define i32 @def_A_i32() {
; CHECK-LABEL: def_A_i32:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; def v0
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
%ret = call i32 asm sideeffect "; def $0", "=^VA"()
ret i32 %ret
}
; ERR: error: couldn't allocate output register for constraint 'VA'
define ptr addrspace(1) @def_A_p1() {
; CHECK-LABEL: def_A_p1:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ;;#ASMSTART
; CHECK-NEXT: ; def v[0:1]
; CHECK-NEXT: ;;#ASMEND
; CHECK-NEXT: s_setpc_b64 s[30:31]
%ret = call ptr addrspace(1) asm sideeffect "; def $0", "=^VA"()
ret ptr addrspace(1) %ret
}