
I'm not sure why these were bothering to check the instruction profile, since those profiles should only be used with these instruction classes.
771 lines
23 KiB
TableGen
771 lines
23 KiB
TableGen
//===-- VOPInstructions.td - Vector Instruction Defintions ----------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// dummies for outer let
|
|
class LetDummies {
|
|
bit isCommutable;
|
|
bit isConvertibleToThreeAddress;
|
|
bit isMoveImm;
|
|
bit isReMaterializable;
|
|
bit isAsCheapAsAMove;
|
|
bit VOPAsmPrefer32Bit;
|
|
bit FPDPRounding;
|
|
Predicate SubtargetPredicate;
|
|
string Constraints;
|
|
string DisableEncoding;
|
|
list<SchedReadWrite> SchedRW;
|
|
list<Register> Uses;
|
|
list<Register> Defs;
|
|
}
|
|
|
|
class VOP <string opName> {
|
|
string OpName = opName;
|
|
}
|
|
|
|
class VOPAnyCommon <dag outs, dag ins, string asm, list<dag> pattern> :
|
|
InstSI <outs, ins, asm, pattern> {
|
|
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
let UseNamedOperandTable = 1;
|
|
let VALU = 1;
|
|
let Uses = [EXEC];
|
|
}
|
|
|
|
class VOP_Pseudo <string opName, string suffix, VOPProfile P, dag outs, dag ins,
|
|
string asm, list<dag> pattern> :
|
|
InstSI <outs, ins, asm, pattern>,
|
|
VOP <opName>,
|
|
SIMCInstr <opName#suffix, SIEncodingFamily.NONE> {
|
|
let isPseudo = 1;
|
|
let isCodeGenOnly = 1;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
string Mnemonic = opName;
|
|
VOPProfile Pfl = P;
|
|
|
|
string AsmOperands;
|
|
}
|
|
|
|
class VOP3Common <dag outs, dag ins, string asm = "",
|
|
list<dag> pattern = [], bit HasMods = 0,
|
|
bit VOP3Only = 0> :
|
|
VOPAnyCommon <outs, ins, asm, pattern> {
|
|
|
|
// Using complex patterns gives VOP3 patterns a very high complexity rating,
|
|
// but standalone patterns are almost always preferred, so we need to adjust the
|
|
// priority lower. The goal is to use a high number to reduce complexity to
|
|
// zero (or less than zero).
|
|
let AddedComplexity = -1000;
|
|
|
|
let VOP3 = 1;
|
|
|
|
let AsmVariantName = AMDGPUAsmVariants.VOP3;
|
|
let AsmMatchConverter = !if(!eq(HasMods,1), "cvtVOP3", "");
|
|
|
|
let isCodeGenOnly = 0;
|
|
|
|
int Size = 8;
|
|
|
|
// Because SGPRs may be allowed if there are multiple operands, we
|
|
// need a post-isel hook to insert copies in order to avoid
|
|
// violating constant bus requirements.
|
|
let hasPostISelHook = 1;
|
|
}
|
|
|
|
class VOP3_Pseudo <string opName, VOPProfile P, list<dag> pattern = [],
|
|
bit VOP3Only = 0, bit isVOP3P = 0, bit isVop3OpSel = 0> :
|
|
VOP_Pseudo <opName, "_e64", P, P.Outs64,
|
|
!if(isVop3OpSel,
|
|
P.InsVOP3OpSel,
|
|
!if(!and(isVOP3P, P.IsPacked), P.InsVOP3P, P.Ins64)),
|
|
"", pattern> {
|
|
|
|
let VOP3_OPSEL = isVop3OpSel;
|
|
let IsPacked = P.IsPacked;
|
|
let IsMAI = P.IsMAI;
|
|
|
|
let AsmOperands = !if(isVop3OpSel,
|
|
P.AsmVOP3OpSel,
|
|
!if(!and(isVOP3P, P.IsPacked), P.AsmVOP3P, P.Asm64));
|
|
|
|
let Size = 8;
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
|
|
// Because SGPRs may be allowed if there are multiple operands, we
|
|
// need a post-isel hook to insert copies in order to avoid
|
|
// violating constant bus requirements.
|
|
let hasPostISelHook = 1;
|
|
|
|
// Using complex patterns gives VOP3 patterns a very high complexity rating,
|
|
// but standalone patterns are almost always preferred, so we need to adjust the
|
|
// priority lower. The goal is to use a high number to reduce complexity to
|
|
// zero (or less than zero).
|
|
let AddedComplexity = -1000;
|
|
|
|
let VOP3 = 1;
|
|
let VALU = 1;
|
|
let FPClamp = P.HasFPClamp;
|
|
let IntClamp = P.HasIntClamp;
|
|
let ClampLo = P.HasClampLo;
|
|
let ClampHi = P.HasClampHi;
|
|
|
|
let Uses = [EXEC];
|
|
|
|
let AsmVariantName = AMDGPUAsmVariants.VOP3;
|
|
let AsmMatchConverter =
|
|
!if(isVOP3P,
|
|
"cvtVOP3P",
|
|
!if(!or(P.HasModifiers, !or(P.HasOMod, P.HasIntClamp)),
|
|
"cvtVOP3",
|
|
""));
|
|
}
|
|
|
|
class VOP3P_Pseudo <string opName, VOPProfile P, list<dag> pattern = []> :
|
|
VOP3_Pseudo<opName, P, pattern, 1, 1> {
|
|
let VOP3P = 1;
|
|
}
|
|
|
|
class VOP3_Real <VOP_Pseudo ps, int EncodingFamily> :
|
|
InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
|
|
SIMCInstr <ps.PseudoInstr, EncodingFamily> {
|
|
|
|
let isPseudo = 0;
|
|
let isCodeGenOnly = 0;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
|
|
// copy relevant pseudo op flags
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
let OtherPredicates = ps.OtherPredicates;
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
let AsmVariantName = ps.AsmVariantName;
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
let TSFlags = ps.TSFlags;
|
|
let UseNamedOperandTable = ps.UseNamedOperandTable;
|
|
let Uses = ps.Uses;
|
|
let Defs = ps.Defs;
|
|
|
|
VOPProfile Pfl = ps.Pfl;
|
|
}
|
|
|
|
// XXX - Is there any reason to distingusih this from regular VOP3
|
|
// here?
|
|
class VOP3P_Real<VOP_Pseudo ps, int EncodingFamily> :
|
|
VOP3_Real<ps, EncodingFamily>;
|
|
|
|
class VOP3a<VOPProfile P> : Enc64 {
|
|
bits<4> src0_modifiers;
|
|
bits<9> src0;
|
|
bits<3> src1_modifiers;
|
|
bits<9> src1;
|
|
bits<3> src2_modifiers;
|
|
bits<9> src2;
|
|
bits<1> clamp;
|
|
bits<2> omod;
|
|
|
|
let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
|
|
let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0);
|
|
let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0);
|
|
|
|
let Inst{31-26} = 0x34; //encoding
|
|
let Inst{40-32} = !if(P.HasSrc0, src0, 0);
|
|
let Inst{49-41} = !if(P.HasSrc1, src1, 0);
|
|
let Inst{58-50} = !if(P.HasSrc2, src2, 0);
|
|
let Inst{60-59} = !if(P.HasOMod, omod, 0);
|
|
let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
|
|
let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
|
|
let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
|
|
}
|
|
|
|
class VOP3a_gfx6_gfx7<bits<9> op, VOPProfile p> : VOP3a<p> {
|
|
let Inst{11} = !if(p.HasClamp, clamp{0}, 0);
|
|
let Inst{25-17} = op;
|
|
}
|
|
|
|
class VOP3a_gfx10<bits<10> op, VOPProfile p> : VOP3a<p> {
|
|
let Inst{15} = !if(p.HasClamp, clamp{0}, 0);
|
|
let Inst{25-16} = op;
|
|
let Inst{31-26} = 0x35;
|
|
}
|
|
|
|
class VOP3a_vi <bits<10> op, VOPProfile P> : VOP3a<P> {
|
|
let Inst{25-16} = op;
|
|
let Inst{15} = !if(P.HasClamp, clamp{0}, 0);
|
|
}
|
|
|
|
class VOP3e_gfx6_gfx7<bits<9> op, VOPProfile p> : VOP3a_gfx6_gfx7<op, p> {
|
|
bits<8> vdst;
|
|
let Inst{7-0} = !if(p.EmitDst, vdst{7-0}, 0);
|
|
}
|
|
|
|
class VOP3e_gfx10<bits<10> op, VOPProfile p> : VOP3a_gfx10<op, p> {
|
|
bits<8> vdst;
|
|
let Inst{7-0} = !if(p.EmitDst, vdst{7-0}, 0);
|
|
}
|
|
|
|
class VOP3e_vi <bits<10> op, VOPProfile P> : VOP3a_vi <op, P> {
|
|
bits<8> vdst;
|
|
let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0);
|
|
}
|
|
|
|
class VOP3OpSel_gfx9 <bits<10> op, VOPProfile P> : VOP3e_vi <op, P> {
|
|
let Inst{11} = !if(P.HasSrc0, src0_modifiers{2}, 0);
|
|
let Inst{12} = !if(P.HasSrc1, src1_modifiers{2}, 0);
|
|
let Inst{13} = !if(P.HasSrc2, src2_modifiers{2}, 0);
|
|
let Inst{14} = !if(P.HasDst, src0_modifiers{3}, 0);
|
|
}
|
|
|
|
class VOP3OpSel_gfx10<bits<10> op, VOPProfile p> : VOP3e_gfx10<op, p> {
|
|
let Inst{11} = !if(p.HasSrc0, src0_modifiers{2}, 0);
|
|
let Inst{12} = !if(p.HasSrc1, src1_modifiers{2}, 0);
|
|
let Inst{13} = !if(p.HasSrc2, src2_modifiers{2}, 0);
|
|
let Inst{14} = !if(p.HasDst, src0_modifiers{3}, 0);
|
|
}
|
|
|
|
// NB: For V_INTERP* opcodes, src0 is encoded as src1 and vice versa
|
|
class VOP3Interp_vi <bits<10> op, VOPProfile P> : VOP3e_vi <op, P> {
|
|
bits<2> attrchan;
|
|
bits<6> attr;
|
|
bits<1> high;
|
|
|
|
let Inst{8} = 0; // No modifiers for src0
|
|
let Inst{61} = 0;
|
|
|
|
let Inst{9} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
|
|
let Inst{62} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
|
|
|
|
let Inst{37-32} = attr;
|
|
let Inst{39-38} = attrchan;
|
|
let Inst{40} = !if(P.HasHigh, high, 0);
|
|
|
|
let Inst{49-41} = src0;
|
|
}
|
|
|
|
class VOP3Interp_gfx10<bits<10> op, VOPProfile p> : VOP3e_gfx10<op, p> {
|
|
bits<6> attr;
|
|
bits<2> attrchan;
|
|
bits<1> high;
|
|
|
|
let Inst{8} = 0;
|
|
let Inst{9} = !if(p.HasSrc0Mods, src0_modifiers{1}, 0);
|
|
let Inst{37-32} = attr;
|
|
let Inst{39-38} = attrchan;
|
|
let Inst{40} = !if(p.HasHigh, high, 0);
|
|
let Inst{49-41} = src0;
|
|
let Inst{61} = 0;
|
|
let Inst{62} = !if(p.HasSrc0Mods, src0_modifiers{0}, 0);
|
|
}
|
|
|
|
class VOP3be <VOPProfile P> : Enc64 {
|
|
bits<8> vdst;
|
|
bits<2> src0_modifiers;
|
|
bits<9> src0;
|
|
bits<2> src1_modifiers;
|
|
bits<9> src1;
|
|
bits<2> src2_modifiers;
|
|
bits<9> src2;
|
|
bits<7> sdst;
|
|
bits<2> omod;
|
|
|
|
let Inst{7-0} = vdst;
|
|
let Inst{14-8} = sdst;
|
|
let Inst{31-26} = 0x34; //encoding
|
|
let Inst{40-32} = !if(P.HasSrc0, src0, 0);
|
|
let Inst{49-41} = !if(P.HasSrc1, src1, 0);
|
|
let Inst{58-50} = !if(P.HasSrc2, src2, 0);
|
|
let Inst{60-59} = !if(P.HasOMod, omod, 0);
|
|
let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
|
|
let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
|
|
let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
|
|
}
|
|
|
|
class VOP3Pe <bits<10> op, VOPProfile P> : Enc64 {
|
|
bits<8> vdst;
|
|
// neg, neg_hi, op_sel put in srcN_modifiers
|
|
bits<4> src0_modifiers;
|
|
bits<9> src0;
|
|
bits<4> src1_modifiers;
|
|
bits<9> src1;
|
|
bits<4> src2_modifiers;
|
|
bits<9> src2;
|
|
bits<1> clamp;
|
|
|
|
let Inst{7-0} = vdst;
|
|
let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // neg_hi src0
|
|
let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // neg_hi src1
|
|
let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); // neg_hi src2
|
|
|
|
let Inst{11} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{2}, 0); // op_sel(0)
|
|
let Inst{12} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{2}, 0); // op_sel(1)
|
|
let Inst{13} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{2}, 0); // op_sel(2)
|
|
|
|
let Inst{14} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{3}, 0); // op_sel_hi(2)
|
|
|
|
let Inst{15} = !if(P.HasClamp, clamp{0}, 0);
|
|
|
|
let Inst{25-16} = op;
|
|
let Inst{31-26} = 0x34; //encoding
|
|
let Inst{40-32} = !if(P.HasSrc0, src0, 0);
|
|
let Inst{49-41} = !if(P.HasSrc1, src1, 0);
|
|
let Inst{58-50} = !if(P.HasSrc2, src2, 0);
|
|
let Inst{59} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{3}, 0); // op_sel_hi(0)
|
|
let Inst{60} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{3}, 0); // op_sel_hi(1)
|
|
let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // neg (lo)
|
|
let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // neg (lo)
|
|
let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); // neg (lo)
|
|
}
|
|
|
|
class VOP3Pe_MAI <bits<10> op, VOPProfile P> : Enc64 {
|
|
bits<8> vdst;
|
|
bits<10> src0;
|
|
bits<10> src1;
|
|
bits<9> src2;
|
|
bits<3> blgp;
|
|
bits<3> cbsz;
|
|
bits<4> abid;
|
|
bits<1> clamp;
|
|
|
|
let Inst{7-0} = vdst;
|
|
|
|
let Inst{10-8} = !if(P.HasSrc1, cbsz, 0);
|
|
let Inst{14-11} = !if(P.HasSrc1, abid, 0);
|
|
|
|
let Inst{15} = !if(P.HasClamp, clamp{0}, 0);
|
|
|
|
let Inst{25-16} = op;
|
|
let Inst{31-26} = 0x34; //encoding
|
|
let Inst{40-32} = !if(P.HasSrc0, src0{8-0}, 0);
|
|
let Inst{49-41} = !if(P.HasSrc1, src1{8-0}, 0);
|
|
let Inst{58-50} = !if(P.HasSrc2, src2, 0);
|
|
|
|
let Inst{59} = !if(P.HasSrc0, src0{9}, 0); // acc(0)
|
|
let Inst{60} = !if(P.HasSrc1, src1{9}, 0); // acc(1)
|
|
|
|
let Inst{63-61} = !if(P.HasSrc1, blgp, 0);
|
|
}
|
|
|
|
|
|
class VOP3Pe_gfx10 <bits<10> op, VOPProfile P> : VOP3Pe<op, P> {
|
|
let Inst{31-26} = 0x33; //encoding
|
|
}
|
|
|
|
class VOP3be_gfx6_gfx7<bits<9> op, VOPProfile p> : VOP3be<p> {
|
|
let Inst{25-17} = op;
|
|
}
|
|
|
|
class VOP3be_gfx10<bits<10> op, VOPProfile p> : VOP3be<p> {
|
|
bits<1> clamp;
|
|
let Inst{15} = !if(p.HasClamp, clamp{0}, 0);
|
|
let Inst{25-16} = op;
|
|
let Inst{31-26} = 0x35;
|
|
}
|
|
|
|
class VOP3be_vi <bits<10> op, VOPProfile P> : VOP3be<P> {
|
|
bits<1> clamp;
|
|
let Inst{25-16} = op;
|
|
let Inst{15} = !if(P.HasClamp, clamp{0}, 0);
|
|
}
|
|
|
|
def SDWA {
|
|
// sdwa_sel
|
|
int BYTE_0 = 0;
|
|
int BYTE_1 = 1;
|
|
int BYTE_2 = 2;
|
|
int BYTE_3 = 3;
|
|
int WORD_0 = 4;
|
|
int WORD_1 = 5;
|
|
int DWORD = 6;
|
|
|
|
// dst_unused
|
|
int UNUSED_PAD = 0;
|
|
int UNUSED_SEXT = 1;
|
|
int UNUSED_PRESERVE = 2;
|
|
}
|
|
|
|
class VOP_SDWAe<VOPProfile P> : Enc64 {
|
|
bits<8> src0;
|
|
bits<3> src0_sel;
|
|
bits<2> src0_modifiers; // float: {abs,neg}, int {sext}
|
|
bits<3> src1_sel;
|
|
bits<2> src1_modifiers;
|
|
bits<3> dst_sel;
|
|
bits<2> dst_unused;
|
|
bits<1> clamp;
|
|
|
|
let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);
|
|
let Inst{42-40} = !if(P.EmitDst, dst_sel{2-0}, 0);
|
|
let Inst{44-43} = !if(P.EmitDst, dst_unused{1-0}, 0);
|
|
let Inst{45} = !if(P.HasSDWAClamp, clamp{0}, 0);
|
|
let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0);
|
|
let Inst{51} = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0);
|
|
let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0);
|
|
let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0);
|
|
let Inst{59} = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0);
|
|
let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0);
|
|
}
|
|
|
|
// GFX9 adds two features to SDWA:
|
|
// 1. Add 3 fields to the SDWA microcode word: S0, S1 and OMOD.
|
|
// a. S0 and S1 indicate that source 0 and 1 respectively are SGPRs rather
|
|
// than VGPRs (at most 1 can be an SGPR);
|
|
// b. OMOD is the standard output modifier (result *2, *4, /2)
|
|
// 2. Add a new version of the SDWA microcode word for VOPC: SDWAB. This
|
|
// replaces OMOD and the dest fields with SD and SDST (SGPR destination)
|
|
// field.
|
|
// a. When SD=1, the SDST is used as the destination for the compare result;
|
|
// b. When SD=0, VCC is used.
|
|
//
|
|
// In GFX9, V_MAC_F16, V_MAC_F32 opcodes cannot be used with SDWA
|
|
|
|
// gfx9 SDWA basic encoding
|
|
class VOP_SDWA9e<VOPProfile P> : Enc64 {
|
|
bits<9> src0; // {src0_sgpr{0}, src0{7-0}}
|
|
bits<3> src0_sel;
|
|
bits<2> src0_modifiers; // float: {abs,neg}, int {sext}
|
|
bits<3> src1_sel;
|
|
bits<2> src1_modifiers;
|
|
bits<1> src1_sgpr;
|
|
|
|
let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);
|
|
let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0);
|
|
let Inst{51} = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0);
|
|
let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0);
|
|
let Inst{55} = !if(P.HasSrc0, src0{8}, 0);
|
|
let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0);
|
|
let Inst{59} = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0);
|
|
let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0);
|
|
let Inst{63} = 0; // src1_sgpr - should be specified in subclass
|
|
}
|
|
|
|
// gfx9 SDWA-A
|
|
class VOP_SDWA9Ae<VOPProfile P> : VOP_SDWA9e<P> {
|
|
bits<3> dst_sel;
|
|
bits<2> dst_unused;
|
|
bits<1> clamp;
|
|
bits<2> omod;
|
|
|
|
let Inst{42-40} = !if(P.EmitDst, dst_sel{2-0}, 0);
|
|
let Inst{44-43} = !if(P.EmitDst, dst_unused{1-0}, 0);
|
|
let Inst{45} = !if(P.HasSDWAClamp, clamp{0}, 0);
|
|
let Inst{47-46} = !if(P.HasSDWAOMod, omod{1-0}, 0);
|
|
}
|
|
|
|
// gfx9 SDWA-B
|
|
class VOP_SDWA9Be<VOPProfile P> : VOP_SDWA9e<P> {
|
|
bits<8> sdst; // {vcc_sdst{0}, sdst{6-0}}
|
|
|
|
let Inst{46-40} = !if(P.EmitDst, sdst{6-0}, ?);
|
|
let Inst{47} = !if(P.EmitDst, sdst{7}, 0);
|
|
}
|
|
|
|
class VOP_SDWA_Pseudo <string opName, VOPProfile P, list<dag> pattern=[]> :
|
|
InstSI <P.OutsSDWA, P.InsSDWA, "", pattern>,
|
|
VOP <opName>,
|
|
SIMCInstr <opName#"_sdwa", SIEncodingFamily.NONE> {
|
|
|
|
let isPseudo = 1;
|
|
let isCodeGenOnly = 1;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
string Mnemonic = opName;
|
|
string AsmOperands = P.AsmSDWA;
|
|
string AsmOperands9 = P.AsmSDWA9;
|
|
|
|
let Size = 8;
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
|
|
let VALU = 1;
|
|
let SDWA = 1;
|
|
let Uses = [EXEC];
|
|
|
|
let SubtargetPredicate = HasSDWA;
|
|
let AssemblerPredicate = HasSDWA;
|
|
let AsmVariantName = !if(P.HasExtSDWA, AMDGPUAsmVariants.SDWA,
|
|
AMDGPUAsmVariants.Disable);
|
|
let DecoderNamespace = "SDWA";
|
|
|
|
VOPProfile Pfl = P;
|
|
}
|
|
|
|
class VOP_SDWA_Real <VOP_SDWA_Pseudo ps> :
|
|
InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
|
|
SIMCInstr <ps.PseudoInstr, SIEncodingFamily.SDWA> {
|
|
|
|
let isPseudo = 0;
|
|
let isCodeGenOnly = 0;
|
|
|
|
let Defs = ps.Defs;
|
|
let Uses = ps.Uses;
|
|
let SchedRW = ps.SchedRW;
|
|
let hasSideEffects = ps.hasSideEffects;
|
|
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
|
|
// Copy relevant pseudo op flags
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
let AssemblerPredicate = ps.AssemblerPredicate;
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
let AsmVariantName = ps.AsmVariantName;
|
|
let UseNamedOperandTable = ps.UseNamedOperandTable;
|
|
let DecoderNamespace = ps.DecoderNamespace;
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
let TSFlags = ps.TSFlags;
|
|
}
|
|
|
|
class Base_VOP_SDWA9_Real <VOP_SDWA_Pseudo ps> :
|
|
InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands9, []> {
|
|
|
|
let isPseudo = 0;
|
|
let isCodeGenOnly = 0;
|
|
|
|
let Defs = ps.Defs;
|
|
let Uses = ps.Uses;
|
|
let SchedRW = ps.SchedRW;
|
|
let hasSideEffects = ps.hasSideEffects;
|
|
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
|
|
let SubtargetPredicate = HasSDWA9;
|
|
let AssemblerPredicate = HasSDWA9;
|
|
let AsmVariantName = !if(ps.Pfl.HasExtSDWA9, AMDGPUAsmVariants.SDWA9,
|
|
AMDGPUAsmVariants.Disable);
|
|
let DecoderNamespace = "SDWA9";
|
|
|
|
// Copy relevant pseudo op flags
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
let UseNamedOperandTable = ps.UseNamedOperandTable;
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
let TSFlags = ps.TSFlags;
|
|
}
|
|
|
|
class VOP_SDWA9_Real <VOP_SDWA_Pseudo ps> :
|
|
Base_VOP_SDWA9_Real <ps >,
|
|
SIMCInstr <ps.PseudoInstr, SIEncodingFamily.SDWA9>;
|
|
|
|
class Base_VOP_SDWA10_Real<VOP_SDWA_Pseudo ps> : Base_VOP_SDWA9_Real<ps> {
|
|
let SubtargetPredicate = HasSDWA10;
|
|
let AssemblerPredicate = HasSDWA10;
|
|
let DecoderNamespace = "SDWA10";
|
|
}
|
|
|
|
class VOP_SDWA10_Real<VOP_SDWA_Pseudo ps> :
|
|
Base_VOP_SDWA10_Real<ps>, SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SDWA10>;
|
|
|
|
class VOP_DPPe<VOPProfile P, bit IsDPP16=0> : Enc64 {
|
|
bits<2> src0_modifiers;
|
|
bits<8> src0;
|
|
bits<2> src1_modifiers;
|
|
bits<9> dpp_ctrl;
|
|
bits<1> bound_ctrl;
|
|
bits<4> bank_mask;
|
|
bits<4> row_mask;
|
|
bit fi;
|
|
|
|
let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);
|
|
let Inst{48-40} = dpp_ctrl;
|
|
let Inst{50} = !if(IsDPP16, fi, ?);
|
|
let Inst{51} = bound_ctrl;
|
|
let Inst{52} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // src0_neg
|
|
let Inst{53} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // src0_abs
|
|
let Inst{54} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // src1_neg
|
|
let Inst{55} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // src1_abs
|
|
let Inst{59-56} = bank_mask;
|
|
let Inst{63-60} = row_mask;
|
|
}
|
|
|
|
class VOP_DPP_Pseudo <string OpName, VOPProfile P, list<dag> pattern=[]> :
|
|
InstSI <P.OutsDPP, P.InsDPP, OpName#P.AsmDPP, pattern>,
|
|
VOP <OpName>,
|
|
SIMCInstr <OpName#"_dpp", SIEncodingFamily.NONE> {
|
|
|
|
let isPseudo = 1;
|
|
let isCodeGenOnly = 1;
|
|
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
let VALU = 1;
|
|
let DPP = 1;
|
|
let Size = 8;
|
|
let Uses = [EXEC];
|
|
let isConvergent = 1;
|
|
|
|
string Mnemonic = OpName;
|
|
string AsmOperands = P.AsmDPP;
|
|
|
|
let AsmMatchConverter = !if(!eq(P.HasModifiers,1), "cvtDPP", "");
|
|
let SubtargetPredicate = HasDPP;
|
|
let AssemblerPredicate = HasDPP;
|
|
let AsmVariantName = !if(P.HasExtDPP, AMDGPUAsmVariants.DPP,
|
|
AMDGPUAsmVariants.Disable);
|
|
let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", "");
|
|
let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, "");
|
|
let DecoderNamespace = "DPP";
|
|
|
|
VOPProfile Pfl = P;
|
|
}
|
|
|
|
class VOP_DPP_Real <VOP_DPP_Pseudo ps, int EncodingFamily> :
|
|
InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
|
|
SIMCInstr <ps.PseudoInstr, EncodingFamily> {
|
|
|
|
let isPseudo = 0;
|
|
let isCodeGenOnly = 0;
|
|
|
|
let Defs = ps.Defs;
|
|
let Uses = ps.Uses;
|
|
let SchedRW = ps.SchedRW;
|
|
let hasSideEffects = ps.hasSideEffects;
|
|
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
|
|
// Copy relevant pseudo op flags
|
|
let isConvergent = ps.isConvergent;
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
let AssemblerPredicate = ps.AssemblerPredicate;
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
let AsmVariantName = ps.AsmVariantName;
|
|
let UseNamedOperandTable = ps.UseNamedOperandTable;
|
|
let DecoderNamespace = ps.DecoderNamespace;
|
|
let Constraints = ps.Constraints;
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
let TSFlags = ps.TSFlags;
|
|
}
|
|
|
|
class VOP_DPP <string OpName, VOPProfile P, bit IsDPP16,
|
|
dag InsDPP = !if(IsDPP16, P.InsDPP16, P.InsDPP),
|
|
string AsmDPP = !if(IsDPP16, P.AsmDPP16, P.AsmDPP)> :
|
|
InstSI <P.OutsDPP, InsDPP, OpName#AsmDPP, []>,
|
|
VOP_DPPe<P, IsDPP16> {
|
|
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
let VALU = 1;
|
|
let DPP = 1;
|
|
let Size = 8;
|
|
|
|
let AsmMatchConverter = !if(!eq(P.HasModifiers,1), "cvtDPP", "");
|
|
let SubtargetPredicate = HasDPP;
|
|
let AssemblerPredicate = HasDPP;
|
|
let AsmVariantName = !if(P.HasExtDPP, AMDGPUAsmVariants.DPP,
|
|
AMDGPUAsmVariants.Disable);
|
|
let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", "");
|
|
let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, "");
|
|
let DecoderNamespace = "DPP";
|
|
}
|
|
|
|
class VOP_DPP8e<VOPProfile P> : Enc64 {
|
|
bits<8> src0;
|
|
bits<24> dpp8;
|
|
bits<9> fi;
|
|
|
|
let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);
|
|
let Inst{63-40} = dpp8{23-0};
|
|
}
|
|
|
|
class VOP_DPP8<string OpName, VOPProfile P> :
|
|
InstSI<P.OutsDPP8, P.InsDPP8, OpName#P.AsmDPP8, []>,
|
|
VOP_DPP8e<P> {
|
|
|
|
let mayLoad = 0;
|
|
let mayStore = 0;
|
|
let hasSideEffects = 0;
|
|
let UseNamedOperandTable = 1;
|
|
|
|
let VALU = 1;
|
|
let DPP = 1;
|
|
let Size = 8;
|
|
|
|
let AsmMatchConverter = "cvtDPP8";
|
|
let SubtargetPredicate = HasDPP8;
|
|
let AssemblerPredicate = HasDPP8;
|
|
let AsmVariantName = !if(P.HasExt, AMDGPUAsmVariants.DPP,
|
|
AMDGPUAsmVariants.Disable);
|
|
let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", "");
|
|
let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, "");
|
|
}
|
|
|
|
def DPP8Mode {
|
|
int FI_0 = 0xE9;
|
|
int FI_1 = 0xEA;
|
|
}
|
|
|
|
class getNumNodeArgs<SDPatternOperator Op> {
|
|
SDNode N = !cast<SDNode>(Op);
|
|
SDTypeProfile TP = N.TypeProfile;
|
|
int ret = TP.NumOperands;
|
|
}
|
|
|
|
|
|
class getDivergentFrag<SDPatternOperator Op> {
|
|
|
|
int NumSrcArgs = getNumNodeArgs<Op>.ret;
|
|
PatFrag ret = PatFrag <
|
|
!if(!eq(NumSrcArgs, 1),
|
|
(ops node:$src0),
|
|
!if(!eq(NumSrcArgs, 2),
|
|
(ops node:$src0, node:$src1),
|
|
(ops node:$src0, node:$src1, node:$src2))),
|
|
!if(!eq(NumSrcArgs, 1),
|
|
(Op $src0),
|
|
!if(!eq(NumSrcArgs, 2),
|
|
(Op $src0, $src1),
|
|
(Op $src0, $src1, $src2))),
|
|
[{ return N->isDivergent(); }]
|
|
>;
|
|
}
|
|
|
|
class VOPPatGen<SDPatternOperator Op, VOPProfile P> {
|
|
|
|
PatFrag Operator = getDivergentFrag < Op >.ret;
|
|
|
|
dag Ins = !foreach(tmp, P.Ins32, !subst(ins, Operator,
|
|
!subst(P.Src0RC32, P.Src0VT,
|
|
!subst(P.Src1RC32, P.Src1VT, tmp))));
|
|
|
|
|
|
dag Outs = !foreach(tmp, P.Outs32, !subst(outs, set,
|
|
!subst(P.DstRC, P.DstVT, tmp)));
|
|
|
|
list<dag> ret = [!con(Outs, (set Ins))];
|
|
}
|
|
|
|
class VOPPatOrNull<SDPatternOperator Op, VOPProfile P> {
|
|
list<dag> ret = !if(!ne(P.NeedPatGen,PatGenMode.NoPattern), VOPPatGen<Op, P>.ret, []);
|
|
}
|
|
|
|
class DivergentFragOrOp<SDPatternOperator Op, VOPProfile P> {
|
|
SDPatternOperator ret = !if(!eq(P.NeedPatGen,PatGenMode.Pattern),
|
|
!if(!isa<SDNode>(Op), getDivergentFrag<Op>.ret, Op), Op);
|
|
}
|
|
|
|
include "VOPCInstructions.td"
|
|
include "VOP1Instructions.td"
|
|
include "VOP2Instructions.td"
|
|
include "VOP3Instructions.td"
|
|
include "VOP3PInstructions.td"
|