2016-08-30 23:20:31 +08:00
|
|
|
//===-- SOPInstructions.td - SOP Instruction Defintions -------------------===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2016-08-30 23:20:31 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
def GPRIdxModeMatchClass : AsmOperandClass {
|
|
|
|
let Name = "GPRIdxMode";
|
|
|
|
let PredicateMethod = "isGPRIdxMode";
|
2019-02-27 21:12:12 +08:00
|
|
|
let ParserMethod = "parseGPRIdxMode";
|
2016-10-13 02:00:51 +08:00
|
|
|
let RenderMethod = "addImmOperands";
|
|
|
|
}
|
|
|
|
|
|
|
|
def GPRIdxMode : Operand<i32> {
|
|
|
|
let PrintMethod = "printVGPRIndexMode";
|
|
|
|
let ParserMatchClass = GPRIdxModeMatchClass;
|
|
|
|
let OperandType = "OPERAND_IMMEDIATE";
|
|
|
|
}
|
|
|
|
|
2018-03-26 21:56:53 +08:00
|
|
|
class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps,
|
|
|
|
list<dag> pattern=[]> :
|
|
|
|
InstSI<outs, ins, "", pattern>,
|
|
|
|
SIMCInstr<opName, SIEncodingFamily.NONE> {
|
|
|
|
|
|
|
|
let isPseudo = 1;
|
|
|
|
let isCodeGenOnly = 1;
|
|
|
|
|
|
|
|
string Mnemonic = opName;
|
|
|
|
string AsmOperands = asmOps;
|
|
|
|
|
|
|
|
bits<1> has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP1 Instructions
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class SOP1_Pseudo <string opName, dag outs, dag ins,
|
|
|
|
string asmOps, list<dag> pattern=[]> :
|
2018-03-26 21:56:53 +08:00
|
|
|
SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
let mayLoad = 0;
|
|
|
|
let mayStore = 0;
|
|
|
|
let hasSideEffects = 0;
|
|
|
|
let SALU = 1;
|
|
|
|
let SOP1 = 1;
|
|
|
|
let SchedRW = [WriteSALU];
|
2016-10-07 00:20:41 +08:00
|
|
|
let Size = 4;
|
2016-09-07 04:00:26 +08:00
|
|
|
let UseNamedOperandTable = 1;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
bits<1> has_src0 = 1;
|
|
|
|
bits<1> has_sdst = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOP1_Real<bits<8> op, SOP1_Pseudo ps> :
|
|
|
|
InstSI <ps.OutOperandList, ps.InOperandList,
|
|
|
|
ps.Mnemonic # " " # ps.AsmOperands, []>,
|
|
|
|
Enc32 {
|
|
|
|
|
|
|
|
let isPseudo = 0;
|
|
|
|
let isCodeGenOnly = 0;
|
2016-10-07 00:20:41 +08:00
|
|
|
let Size = 4;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
// copy relevant pseudo op flags
|
|
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
|
|
|
|
|
|
// encoding
|
|
|
|
bits<7> sdst;
|
|
|
|
bits<8> src0;
|
|
|
|
|
|
|
|
let Inst{7-0} = !if(ps.has_src0, src0, ?);
|
|
|
|
let Inst{15-8} = op;
|
|
|
|
let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
|
|
|
|
let Inst{31-23} = 0x17d; //encoding;
|
|
|
|
}
|
|
|
|
|
2019-02-26 03:24:46 +08:00
|
|
|
class SOP1_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
|
|
|
|
opName, (outs SReg_32:$sdst),
|
|
|
|
!if(tied_in, (ins SSrc_b32:$src0, SReg_32:$sdst_in),
|
|
|
|
(ins SSrc_b32:$src0)),
|
|
|
|
"$sdst, $src0", pattern> {
|
|
|
|
let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
// 32-bit input, no output.
|
|
|
|
class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo <
|
|
|
|
opName, (outs), (ins SSrc_b32:$src0),
|
|
|
|
"$src0", pattern> {
|
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
2017-04-12 20:40:19 +08:00
|
|
|
class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo <
|
|
|
|
opName, (outs), (ins SReg_32:$src0),
|
|
|
|
"$src0", pattern> {
|
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0", pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
// 64-bit input, 32-bit output.
|
|
|
|
class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0", pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
// 32-bit input, 64-bit output.
|
2019-02-26 03:24:46 +08:00
|
|
|
class SOP1_64_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
|
|
|
|
opName, (outs SReg_64:$sdst),
|
|
|
|
!if(tied_in, (ins SSrc_b32:$src0, SReg_64:$sdst_in),
|
|
|
|
(ins SSrc_b32:$src0)),
|
|
|
|
"$sdst, $src0", pattern> {
|
|
|
|
let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
// no input, 64-bit output.
|
|
|
|
class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
|
|
|
|
opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> {
|
|
|
|
let has_src0 = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// 64-bit input, no output
|
|
|
|
class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
|
|
|
|
opName, (outs), (ins SReg_64:$src0), "$src0", pattern> {
|
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
let isMoveImm = 1 in {
|
|
|
|
let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
|
|
|
|
def S_MOV_B32 : SOP1_32 <"s_mov_b32">;
|
|
|
|
def S_MOV_B64 : SOP1_64 <"s_mov_b64">;
|
|
|
|
} // End isRematerializeable = 1
|
|
|
|
|
|
|
|
let Uses = [SCC] in {
|
|
|
|
def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">;
|
|
|
|
def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">;
|
|
|
|
} // End Uses = [SCC]
|
|
|
|
} // End isMoveImm = 1
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_NOT_B32 : SOP1_32 <"s_not_b32",
|
|
|
|
[(set i32:$sdst, (not i32:$src0))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_NOT_B64 : SOP1_64 <"s_not_b64",
|
|
|
|
[(set i64:$sdst, (not i64:$src0))]
|
|
|
|
>;
|
|
|
|
def S_WQM_B32 : SOP1_32 <"s_wqm_b32">;
|
2017-10-24 18:26:59 +08:00
|
|
|
def S_WQM_B64 : SOP1_64 <"s_wqm_b64",
|
|
|
|
[(set i1:$sdst, (int_amdgcn_wqm_vote i1:$src0))]
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
|
|
|
|
def S_BREV_B32 : SOP1_32 <"s_brev_b32",
|
|
|
|
[(set i32:$sdst, (bitreverse i32:$src0))]
|
|
|
|
>;
|
|
|
|
def S_BREV_B64 : SOP1_64 <"s_brev_b64">;
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">;
|
|
|
|
def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">;
|
|
|
|
def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32",
|
|
|
|
[(set i32:$sdst, (ctpop i32:$src0))]
|
|
|
|
>;
|
|
|
|
def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64">;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">;
|
|
|
|
def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">;
|
2017-10-13 03:37:14 +08:00
|
|
|
def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64">;
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32",
|
2017-10-13 03:37:14 +08:00
|
|
|
[(set i32:$sdst, (AMDGPUffbl_b32 i32:$src0))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32",
|
|
|
|
[(set i32:$sdst, (AMDGPUffbh_u32 i32:$src0))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64">;
|
|
|
|
def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32",
|
|
|
|
[(set i32:$sdst, (AMDGPUffbh_i32 i32:$src0))]
|
|
|
|
>;
|
|
|
|
def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">;
|
|
|
|
def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8",
|
|
|
|
[(set i32:$sdst, (sext_inreg i32:$src0, i8))]
|
|
|
|
>;
|
|
|
|
def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16",
|
|
|
|
[(set i32:$sdst, (sext_inreg i32:$src0, i16))]
|
|
|
|
>;
|
|
|
|
|
2019-02-26 03:24:46 +08:00
|
|
|
def S_BITSET0_B32 : SOP1_32 <"s_bitset0_b32", [], 1>;
|
|
|
|
def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64", [], 1>;
|
|
|
|
def S_BITSET1_B32 : SOP1_32 <"s_bitset1_b32", [], 1>;
|
|
|
|
def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64", [], 1>;
|
2017-05-27 04:38:26 +08:00
|
|
|
def S_GETPC_B64 : SOP1_64_0 <"s_getpc_b64",
|
|
|
|
[(set i64:$sdst, (int_amdgcn_s_getpc))]
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2017-05-18 05:56:25 +08:00
|
|
|
let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in {
|
|
|
|
|
|
|
|
let isBranch = 1, isIndirectBranch = 1 in {
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_SETPC_B64 : SOP1_1 <"s_setpc_b64">;
|
2017-05-18 05:56:25 +08:00
|
|
|
} // End isBranch = 1, isIndirectBranch = 1
|
|
|
|
|
|
|
|
let isReturn = 1 in {
|
|
|
|
// Define variant marked as return rather than branch.
|
|
|
|
def S_SETPC_B64_return : SOP1_1<"", [(AMDGPUret_flag i64:$src0)]>;
|
|
|
|
}
|
|
|
|
} // End isTerminator = 1, isBarrier = 1
|
|
|
|
|
|
|
|
let isCall = 1 in {
|
|
|
|
def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64"
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
}
|
2017-05-18 05:56:25 +08:00
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_RFE_B64 : SOP1_1 <"s_rfe_b64">;
|
|
|
|
|
|
|
|
let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in {
|
|
|
|
|
|
|
|
def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">;
|
|
|
|
def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">;
|
|
|
|
def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">;
|
|
|
|
def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">;
|
|
|
|
def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">;
|
|
|
|
def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">;
|
|
|
|
def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">;
|
|
|
|
def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">;
|
|
|
|
|
|
|
|
} // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC]
|
|
|
|
|
|
|
|
def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32">;
|
|
|
|
def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64">;
|
|
|
|
|
|
|
|
let Uses = [M0] in {
|
|
|
|
def S_MOVRELS_B32 : SOP1_32 <"s_movrels_b32">;
|
|
|
|
def S_MOVRELS_B64 : SOP1_64 <"s_movrels_b64">;
|
|
|
|
def S_MOVRELD_B32 : SOP1_32 <"s_movreld_b32">;
|
|
|
|
def S_MOVRELD_B64 : SOP1_64 <"s_movreld_b64">;
|
|
|
|
} // End Uses = [M0]
|
|
|
|
|
2017-04-12 20:40:19 +08:00
|
|
|
def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">;
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_MOV_REGRD_B32 : SOP1_32 <"s_mov_regrd_b32">;
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_ABS_I32 : SOP1_32 <"s_abs_i32">;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
def S_MOV_FED_B32 : SOP1_32 <"s_mov_fed_b32">;
|
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
let SubtargetPredicate = HasVGPRIndexMode in {
|
|
|
|
def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> {
|
|
|
|
let Uses = [M0];
|
|
|
|
let Defs = [M0];
|
|
|
|
}
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isGFX9 in {
|
2018-04-07 00:35:11 +08:00
|
|
|
let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
|
|
|
|
def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">;
|
|
|
|
def S_ORN1_SAVEEXEC_B64 : SOP1_64<"s_orn1_saveexec_b64">;
|
|
|
|
def S_ANDN1_WREXEC_B64 : SOP1_64<"s_andn1_wrexec_b64">;
|
|
|
|
def S_ANDN2_WREXEC_B64 : SOP1_64<"s_andn2_wrexec_b64">;
|
|
|
|
} // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
|
|
|
|
|
|
|
|
def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32">;
|
2019-02-23 07:21:06 +08:00
|
|
|
} // End SubtargetPredicate = isGFX9
|
2018-04-07 00:35:11 +08:00
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP2 Instructions
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class SOP2_Pseudo<string opName, dag outs, dag ins,
|
|
|
|
string asmOps, list<dag> pattern=[]> :
|
2018-03-26 21:56:53 +08:00
|
|
|
SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
let mayLoad = 0;
|
|
|
|
let mayStore = 0;
|
|
|
|
let hasSideEffects = 0;
|
|
|
|
let SALU = 1;
|
|
|
|
let SOP2 = 1;
|
|
|
|
let SchedRW = [WriteSALU];
|
|
|
|
let UseNamedOperandTable = 1;
|
|
|
|
|
2018-03-26 21:56:53 +08:00
|
|
|
let has_sdst = 1;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
// Pseudo instructions have no encodings, but adding this field here allows
|
|
|
|
// us to do:
|
|
|
|
// let sdst = xxx in {
|
|
|
|
// for multiclasses that include both real and pseudo instructions.
|
|
|
|
// field bits<7> sdst = 0;
|
|
|
|
// let Size = 4; // Do we need size here?
|
|
|
|
}
|
|
|
|
|
2018-03-26 21:56:53 +08:00
|
|
|
class SOP2_Real<bits<7> op, SOP_Pseudo ps> :
|
2016-08-30 23:20:31 +08:00
|
|
|
InstSI <ps.OutOperandList, ps.InOperandList,
|
|
|
|
ps.Mnemonic # " " # ps.AsmOperands, []>,
|
|
|
|
Enc32 {
|
|
|
|
let isPseudo = 0;
|
|
|
|
let isCodeGenOnly = 0;
|
|
|
|
|
|
|
|
// copy relevant pseudo op flags
|
|
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
2019-01-18 21:57:43 +08:00
|
|
|
let UseNamedOperandTable = ps.UseNamedOperandTable;
|
|
|
|
let TSFlags = ps.TSFlags;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
// encoding
|
|
|
|
bits<7> sdst;
|
|
|
|
bits<8> src0;
|
|
|
|
bits<8> src1;
|
|
|
|
|
|
|
|
let Inst{7-0} = src0;
|
|
|
|
let Inst{15-8} = src1;
|
|
|
|
let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
|
|
|
|
let Inst{29-23} = op;
|
|
|
|
let Inst{31-30} = 0x2; // encoding
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0, $src1", pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0, $src1", pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0, $src1", pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $src0, $src1", pattern
|
|
|
|
>;
|
|
|
|
|
2018-11-30 00:05:38 +08:00
|
|
|
class UniformUnaryFrag<SDPatternOperator Op> : PatFrag <
|
|
|
|
(ops node:$src0),
|
|
|
|
(Op $src0),
|
|
|
|
[{ return !N->isDivergent(); }]
|
|
|
|
>;
|
|
|
|
|
2018-09-21 18:31:22 +08:00
|
|
|
class UniformBinFrag<SDPatternOperator Op> : PatFrag <
|
|
|
|
(ops node:$src0, node:$src1),
|
|
|
|
(Op $src0, $src1),
|
|
|
|
[{ return !N->isDivergent(); }]
|
|
|
|
>;
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
let Defs = [SCC] in { // Carry out goes to SCC
|
|
|
|
let isCommutable = 1 in {
|
|
|
|
def S_ADD_U32 : SOP2_32 <"s_add_u32">;
|
|
|
|
def S_ADD_I32 : SOP2_32 <"s_add_i32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
} // End isCommutable = 1
|
|
|
|
|
|
|
|
def S_SUB_U32 : SOP2_32 <"s_sub_u32">;
|
|
|
|
def S_SUB_I32 : SOP2_32 <"s_sub_i32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
let Uses = [SCC] in { // Carry in comes from SCC
|
|
|
|
let isCommutable = 1 in {
|
|
|
|
def S_ADDC_U32 : SOP2_32 <"s_addc_u32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End isCommutable = 1
|
|
|
|
|
|
|
|
def S_SUBB_U32 : SOP2_32 <"s_subb_u32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End Uses = [SCC]
|
|
|
|
|
2016-09-07 14:25:55 +08:00
|
|
|
|
|
|
|
let isCommutable = 1 in {
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_MIN_I32 : SOP2_32 <"s_min_i32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_MIN_U32 : SOP2_32 <"s_min_u32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_MAX_I32 : SOP2_32 <"s_max_i32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_MAX_U32 : SOP2_32 <"s_max_u32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
2016-09-07 14:25:55 +08:00
|
|
|
} // End isCommutable = 1
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
|
|
|
|
let Uses = [SCC] in {
|
|
|
|
def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">;
|
|
|
|
def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">;
|
|
|
|
} // End Uses = [SCC]
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
2016-09-07 14:25:55 +08:00
|
|
|
let isCommutable = 1 in {
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_AND_B32 : SOP2_32 <"s_and_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_AND_B64 : SOP2_64 <"s_and_b64",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_OR_B32 : SOP2_32 <"s_or_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_OR_B64 : SOP2_64 <"s_or_b64",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_XOR_B32 : SOP2_32 <"s_xor_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
def S_XOR_B64 : SOP2_64 <"s_xor_b64",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
2017-09-19 05:22:45 +08:00
|
|
|
|
|
|
|
def S_XNOR_B32 : SOP2_32 <"s_xnor_b32",
|
|
|
|
[(set i32:$sdst, (not (xor_oneuse i32:$src0, i32:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_XNOR_B64 : SOP2_64 <"s_xnor_b64",
|
|
|
|
[(set i64:$sdst, (not (xor_oneuse i64:$src0, i64:$src1)))]
|
|
|
|
>;
|
2018-11-30 00:05:38 +08:00
|
|
|
|
|
|
|
def S_NAND_B32 : SOP2_32 <"s_nand_b32",
|
|
|
|
[(set i32:$sdst, (not (and_oneuse i32:$src0, i32:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_NAND_B64 : SOP2_64 <"s_nand_b64",
|
|
|
|
[(set i64:$sdst, (not (and_oneuse i64:$src0, i64:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_NOR_B32 : SOP2_32 <"s_nor_b32",
|
|
|
|
[(set i32:$sdst, (not (or_oneuse i32:$src0, i32:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_NOR_B64 : SOP2_64 <"s_nor_b64",
|
|
|
|
[(set i64:$sdst, (not (or_oneuse i64:$src0, i64:$src1)))]
|
|
|
|
>;
|
2016-09-07 14:25:55 +08:00
|
|
|
} // End isCommutable = 1
|
|
|
|
|
2018-11-30 00:05:38 +08:00
|
|
|
def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32",
|
|
|
|
[(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64",
|
|
|
|
[(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_ORN2_B32 : SOP2_32 <"s_orn2_b32",
|
|
|
|
[(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_ORN2_B64 : SOP2_64 <"s_orn2_b64",
|
|
|
|
[(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
// Use added complexity so these patterns are preferred to the VALU patterns.
|
|
|
|
let AddedComplexity = 1 in {
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
2018-09-21 18:31:22 +08:00
|
|
|
// TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_LSHL_B32 : SOP2_32 <"s_lshl_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<shl> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64",
|
2018-10-01 19:06:35 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<shl> i64:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_LSHR_B32 : SOP2_32 <"s_lshr_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<srl> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64",
|
2018-10-01 19:06:35 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<srl> i64:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_ASHR_I32 : SOP2_32 <"s_ashr_i32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<sra> i32:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64",
|
2018-10-01 19:06:35 +08:00
|
|
|
[(set i64:$sdst, (UniformBinFrag<sra> i64:$src0, i32:$src1))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
def S_BFM_B32 : SOP2_32 <"s_bfm_b32",
|
2018-09-21 18:31:22 +08:00
|
|
|
[(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>;
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">;
|
2018-09-21 18:31:22 +08:00
|
|
|
|
|
|
|
// TODO: S_MUL_I32 require V_MUL_LO_I32 from VOP3 change
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_MUL_I32 : SOP2_32 <"s_mul_i32",
|
2016-09-07 14:25:55 +08:00
|
|
|
[(set i32:$sdst, (mul i32:$src0, i32:$src1))]> {
|
|
|
|
let isCommutable = 1;
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
} // End AddedComplexity = 1
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_BFE_U32 : SOP2_32 <"s_bfe_u32">;
|
|
|
|
def S_BFE_I32 : SOP2_32 <"s_bfe_i32">;
|
|
|
|
def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">;
|
|
|
|
def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
def S_CBRANCH_G_FORK : SOP2_Pseudo <
|
|
|
|
"s_cbranch_g_fork", (outs),
|
2017-04-14 19:52:26 +08:00
|
|
|
(ins SCSrc_b64:$src0, SCSrc_b64:$src1),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$src0, $src1"
|
|
|
|
> {
|
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isVI in {
|
2017-04-13 01:10:07 +08:00
|
|
|
def S_RFE_RESTORE_B64 : SOP2_Pseudo <
|
|
|
|
"s_rfe_restore_b64", (outs),
|
|
|
|
(ins SSrc_b64:$src0, SSrc_b32:$src1),
|
|
|
|
"$src0, $src1"
|
|
|
|
> {
|
|
|
|
let hasSideEffects = 1;
|
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isGFX9 in {
|
2017-02-28 02:49:11 +08:00
|
|
|
def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">;
|
|
|
|
def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">;
|
|
|
|
def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">;
|
2018-04-09 21:10:33 +08:00
|
|
|
|
|
|
|
let Defs = [SCC] in {
|
|
|
|
def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32">;
|
|
|
|
def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32">;
|
|
|
|
def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32">;
|
|
|
|
def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32">;
|
|
|
|
} // End Defs = [SCC]
|
|
|
|
|
|
|
|
def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32">;
|
|
|
|
def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32">;
|
2017-02-28 02:49:11 +08:00
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOPK Instructions
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class SOPK_Pseudo <string opName, dag outs, dag ins,
|
|
|
|
string asmOps, list<dag> pattern=[]> :
|
|
|
|
InstSI <outs, ins, "", pattern>,
|
|
|
|
SIMCInstr<opName, SIEncodingFamily.NONE> {
|
|
|
|
let isPseudo = 1;
|
|
|
|
let isCodeGenOnly = 1;
|
|
|
|
let mayLoad = 0;
|
|
|
|
let mayStore = 0;
|
|
|
|
let hasSideEffects = 0;
|
|
|
|
let SALU = 1;
|
|
|
|
let SOPK = 1;
|
|
|
|
let SchedRW = [WriteSALU];
|
|
|
|
let UseNamedOperandTable = 1;
|
|
|
|
string Mnemonic = opName;
|
|
|
|
string AsmOperands = asmOps;
|
|
|
|
|
|
|
|
bits<1> has_sdst = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPK_Real<bits<5> op, SOPK_Pseudo ps> :
|
|
|
|
InstSI <ps.OutOperandList, ps.InOperandList,
|
|
|
|
ps.Mnemonic # " " # ps.AsmOperands, []> {
|
|
|
|
let isPseudo = 0;
|
|
|
|
let isCodeGenOnly = 0;
|
|
|
|
|
|
|
|
// copy relevant pseudo op flags
|
|
|
|
let SubtargetPredicate = ps.SubtargetPredicate;
|
|
|
|
let AsmMatchConverter = ps.AsmMatchConverter;
|
|
|
|
let DisableEncoding = ps.DisableEncoding;
|
|
|
|
let Constraints = ps.Constraints;
|
|
|
|
|
|
|
|
// encoding
|
|
|
|
bits<7> sdst;
|
|
|
|
bits<16> simm16;
|
|
|
|
bits<32> imm;
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPK_Real32<bits<5> op, SOPK_Pseudo ps> :
|
|
|
|
SOPK_Real <op, ps>,
|
|
|
|
Enc32 {
|
|
|
|
let Inst{15-0} = simm16;
|
|
|
|
let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
|
|
|
|
let Inst{27-23} = op;
|
|
|
|
let Inst{31-28} = 0xb; //encoding
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> :
|
|
|
|
SOPK_Real<op, ps>,
|
|
|
|
Enc64 {
|
|
|
|
let Inst{15-0} = simm16;
|
|
|
|
let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
|
|
|
|
let Inst{27-23} = op;
|
|
|
|
let Inst{31-28} = 0xb; //encoding
|
|
|
|
let Inst{63-32} = imm;
|
|
|
|
}
|
|
|
|
|
2016-09-17 05:41:16 +08:00
|
|
|
class SOPKInstTable <bit is_sopk, string cmpOp = ""> {
|
|
|
|
bit IsSOPK = is_sopk;
|
|
|
|
string BaseCmpOp = cmpOp;
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
|
|
|
|
opName,
|
|
|
|
(outs SReg_32:$sdst),
|
2017-04-26 23:34:19 +08:00
|
|
|
(ins s16imm:$simm16),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $simm16",
|
|
|
|
pattern>;
|
|
|
|
|
2017-04-26 23:34:19 +08:00
|
|
|
class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo <
|
2016-08-30 23:20:31 +08:00
|
|
|
opName,
|
|
|
|
(outs),
|
2017-04-26 23:34:19 +08:00
|
|
|
!if(isSignExt,
|
|
|
|
(ins SReg_32:$sdst, s16imm:$simm16),
|
|
|
|
(ins SReg_32:$sdst, u16imm:$simm16)),
|
2016-09-17 05:41:16 +08:00
|
|
|
"$sdst, $simm16", []>,
|
|
|
|
SOPKInstTable<1, base_op>{
|
2016-08-30 23:20:31 +08:00
|
|
|
let Defs = [SCC];
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
|
|
|
|
opName,
|
|
|
|
(outs SReg_32:$sdst),
|
2017-04-26 23:34:19 +08:00
|
|
|
(ins SReg_32:$src0, s16imm:$simm16),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $simm16",
|
|
|
|
pattern
|
|
|
|
>;
|
|
|
|
|
|
|
|
let isReMaterializable = 1, isMoveImm = 1 in {
|
|
|
|
def S_MOVK_I32 : SOPK_32 <"s_movk_i32">;
|
|
|
|
} // End isReMaterializable = 1
|
|
|
|
let Uses = [SCC] in {
|
|
|
|
def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">;
|
|
|
|
}
|
|
|
|
|
|
|
|
let isCompare = 1 in {
|
|
|
|
|
|
|
|
// This instruction is disabled for now until we can figure out how to teach
|
|
|
|
// the instruction selector to correctly use the S_CMP* vs V_CMP*
|
|
|
|
// instructions.
|
|
|
|
//
|
|
|
|
// When this instruction is enabled the code generator sometimes produces this
|
|
|
|
// invalid sequence:
|
|
|
|
//
|
|
|
|
// SCC = S_CMPK_EQ_I32 SGPR0, imm
|
|
|
|
// VCC = COPY SCC
|
|
|
|
// VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1
|
|
|
|
//
|
|
|
|
// def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32",
|
|
|
|
// [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))]
|
|
|
|
// >;
|
|
|
|
|
2017-04-26 23:34:19 +08:00
|
|
|
def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>;
|
|
|
|
def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>;
|
|
|
|
def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>;
|
|
|
|
def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>;
|
|
|
|
def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>;
|
|
|
|
def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>;
|
2016-09-17 05:41:16 +08:00
|
|
|
|
|
|
|
let SOPKZext = 1 in {
|
2017-04-26 23:34:19 +08:00
|
|
|
def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>;
|
|
|
|
def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>;
|
|
|
|
def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>;
|
|
|
|
def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>;
|
|
|
|
def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>;
|
|
|
|
def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>;
|
2016-09-17 05:41:16 +08:00
|
|
|
} // End SOPKZext = 1
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End isCompare = 1
|
|
|
|
|
|
|
|
let Defs = [SCC], isCommutable = 1, DisableEncoding = "$src0",
|
|
|
|
Constraints = "$sdst = $src0" in {
|
|
|
|
def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">;
|
|
|
|
def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">;
|
|
|
|
}
|
|
|
|
|
|
|
|
def S_CBRANCH_I_FORK : SOPK_Pseudo <
|
|
|
|
"s_cbranch_i_fork",
|
2017-04-26 23:34:19 +08:00
|
|
|
(outs), (ins SReg_64:$sdst, s16imm:$simm16),
|
2016-08-30 23:20:31 +08:00
|
|
|
"$sdst, $simm16"
|
|
|
|
>;
|
|
|
|
|
|
|
|
let mayLoad = 1 in {
|
|
|
|
def S_GETREG_B32 : SOPK_Pseudo <
|
|
|
|
"s_getreg_b32",
|
|
|
|
(outs SReg_32:$sdst), (ins hwreg:$simm16),
|
|
|
|
"$sdst, $simm16"
|
|
|
|
>;
|
|
|
|
}
|
|
|
|
|
2016-12-07 10:42:15 +08:00
|
|
|
let hasSideEffects = 1 in {
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_SETREG_B32 : SOPK_Pseudo <
|
|
|
|
"s_setreg_b32",
|
|
|
|
(outs), (ins SReg_32:$sdst, hwreg:$simm16),
|
2016-12-07 10:42:15 +08:00
|
|
|
"$simm16, $sdst",
|
|
|
|
[(AMDGPUsetreg i32:$sdst, (i16 timm:$simm16))]
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
// FIXME: Not on SI?
|
|
|
|
//def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">;
|
|
|
|
|
|
|
|
def S_SETREG_IMM32_B32 : SOPK_Pseudo <
|
|
|
|
"s_setreg_imm32_b32",
|
|
|
|
(outs), (ins i32imm:$imm, hwreg:$simm16),
|
2016-10-06 18:13:23 +08:00
|
|
|
"$simm16, $imm"> {
|
|
|
|
let Size = 8; // Unlike every other SOPK instruction.
|
2016-08-30 23:20:31 +08:00
|
|
|
let has_sdst = 0;
|
|
|
|
}
|
|
|
|
|
2016-12-07 10:42:15 +08:00
|
|
|
} // End hasSideEffects = 1
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isGFX9 in {
|
2018-04-07 02:24:49 +08:00
|
|
|
def S_CALL_B64 : SOPK_Pseudo<
|
|
|
|
"s_call_b64",
|
|
|
|
(outs SReg_64:$sdst),
|
|
|
|
(ins s16imm:$simm16),
|
|
|
|
"$sdst, $simm16"> {
|
|
|
|
let isCall = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOPC Instructions
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class SOPCe <bits<7> op> : Enc32 {
|
|
|
|
bits<8> src0;
|
|
|
|
bits<8> src1;
|
|
|
|
|
|
|
|
let Inst{7-0} = src0;
|
|
|
|
let Inst{15-8} = src1;
|
|
|
|
let Inst{22-16} = op;
|
|
|
|
let Inst{31-23} = 0x17e;
|
|
|
|
}
|
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
class SOPC <bits<7> op, dag outs, dag ins, string asm,
|
|
|
|
list<dag> pattern = []> :
|
2016-08-30 23:20:31 +08:00
|
|
|
InstSI<outs, ins, asm, pattern>, SOPCe <op> {
|
|
|
|
let mayLoad = 0;
|
|
|
|
let mayStore = 0;
|
|
|
|
let hasSideEffects = 0;
|
|
|
|
let SALU = 1;
|
|
|
|
let SOPC = 1;
|
|
|
|
let isCodeGenOnly = 0;
|
|
|
|
let Defs = [SCC];
|
|
|
|
let SchedRW = [WriteSALU];
|
|
|
|
let UseNamedOperandTable = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPC_Base <bits<7> op, RegisterOperand rc0, RegisterOperand rc1,
|
|
|
|
string opName, list<dag> pattern = []> : SOPC <
|
|
|
|
op, (outs), (ins rc0:$src0, rc1:$src1),
|
|
|
|
opName#" $src0, $src1", pattern > {
|
|
|
|
let Defs = [SCC];
|
|
|
|
}
|
|
|
|
class SOPC_Helper <bits<7> op, RegisterOperand rc, ValueType vt,
|
|
|
|
string opName, PatLeaf cond> : SOPC_Base <
|
|
|
|
op, rc, rc, opName,
|
|
|
|
[(set SCC, (si_setcc_uniform vt:$src0, vt:$src1, cond))] > {
|
|
|
|
}
|
|
|
|
|
2016-09-17 05:41:16 +08:00
|
|
|
class SOPC_CMP_32<bits<7> op, string opName,
|
|
|
|
PatLeaf cond = COND_NULL, string revOp = opName>
|
|
|
|
: SOPC_Helper<op, SSrc_b32, i32, opName, cond>,
|
|
|
|
Commutable_REV<revOp, !eq(revOp, opName)>,
|
|
|
|
SOPKInstTable<0, opName> {
|
|
|
|
let isCompare = 1;
|
|
|
|
let isCommutable = 1;
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2016-09-17 10:02:19 +08:00
|
|
|
class SOPC_CMP_64<bits<7> op, string opName,
|
|
|
|
PatLeaf cond = COND_NULL, string revOp = opName>
|
|
|
|
: SOPC_Helper<op, SSrc_b64, i64, opName, cond>,
|
|
|
|
Commutable_REV<revOp, !eq(revOp, opName)> {
|
|
|
|
let isCompare = 1;
|
|
|
|
let isCommutable = 1;
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
class SOPC_32<bits<7> op, string opName, list<dag> pattern = []>
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
: SOPC_Base<op, SSrc_b32, SSrc_b32, opName, pattern>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
class SOPC_64_32<bits<7> op, string opName, list<dag> pattern = []>
|
AMDGPU] Assembler: better support for immediate literals in assembler.
Summary:
Prevously assembler parsed all literals as either 32-bit integers or 32-bit floating-point values. Because of this we couldn't support f64 literals.
E.g. in instruction "v_fract_f64 v[0:1], 0.5", literal 0.5 was encoded as 32-bit literal 0x3f000000, which is incorrect and will be interpreted as 3.0517578125E-5 instead of 0.5. Correct encoding is inline constant 240 (optimal) or 32-bit literal 0x3FE00000 at least.
With this change the way immediate literals are parsed is changed. All literals are always parsed as 64-bit values either integer or floating-point. Then we convert parsed literals to correct form based on information about type of operand parsed (was literal floating or binary) and type of expected instruction operands (is this f32/64 or b32/64 instruction).
Here are rules how we convert literals:
- We parsed fp literal:
- Instruction expects 64-bit operand:
- If parsed literal is inlinable (e.g. v_fract_f64_e32 v[0:1], 0.5)
- then we do nothing this literal
- Else if literal is not-inlinable but instruction requires to inline it (e.g. this is e64 encoding, v_fract_f64_e64 v[0:1], 1.5)
- report error
- Else literal is not-inlinable but we can encode it as additional 32-bit literal constant
- If instruction expect fp operand type (f64)
- Check if low 32 bits of literal are zeroes (e.g. v_fract_f64 v[0:1], 1.5)
- If so then do nothing
- Else (e.g. v_fract_f64 v[0:1], 3.1415)
- report warning that low 32 bits will be set to zeroes and precision will be lost
- set low 32 bits of literal to zeroes
- Instruction expects integer operand type (e.g. s_mov_b64_e32 s[0:1], 1.5)
- report error as it is unclear how to encode this literal
- Instruction expects 32-bit operand:
- Convert parsed 64 bit fp literal to 32 bit fp. Allow lose of precision but not overflow or underflow
- Is this literal inlinable and are we required to inline literal (e.g. v_trunc_f32_e64 v0, 0.5)
- do nothing
- Else report error
- Do nothing. We can encode any other 32-bit fp literal (e.g. v_trunc_f32 v0, 10000000.0)
- Parsed binary literal:
- Is this literal inlinable (e.g. v_trunc_f32_e32 v0, 35)
- do nothing
- Else, are we required to inline this literal (e.g. v_trunc_f32_e64 v0, 35)
- report error
- Else, literal is not-inlinable and we are not required to inline it
- Are high 32 bit of literal zeroes or same as sign bit (32 bit)
- do nothing (e.g. v_trunc_f32 v0, 0xdeadbeef)
- Else
- report error (e.g. v_trunc_f32 v0, 0x123456789abcdef0)
For this change it is required that we know operand types of instruction (are they f32/64 or b32/64). I added several new register operands (they extend previous register operands) and set operand types to corresponding types:
'''
enum OperandType {
OPERAND_REG_IMM32_INT,
OPERAND_REG_IMM32_FP,
OPERAND_REG_INLINE_C_INT,
OPERAND_REG_INLINE_C_FP,
}
'''
This is not working yet:
- Several tests are failing
- Problems with predicate methods for inline immediates
- LLVM generated assembler parts try to select e64 encoding before e32.
More changes are required for several AsmOperands.
Reviewers: vpykhtin, tstellarAMD
Subscribers: arsenm, kzhuravl, artem.tamazov
Differential Revision: https://reviews.llvm.org/D22922
llvm-svn: 281050
2016-09-09 22:44:04 +08:00
|
|
|
: SOPC_Base<op, SSrc_b64, SSrc_b32, opName, pattern>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2016-09-30 09:50:20 +08:00
|
|
|
def S_CMP_EQ_I32 : SOPC_CMP_32 <0x00, "s_cmp_eq_i32">;
|
|
|
|
def S_CMP_LG_I32 : SOPC_CMP_32 <0x01, "s_cmp_lg_i32">;
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_CMP_GT_I32 : SOPC_CMP_32 <0x02, "s_cmp_gt_i32", COND_SGT>;
|
|
|
|
def S_CMP_GE_I32 : SOPC_CMP_32 <0x03, "s_cmp_ge_i32", COND_SGE>;
|
2016-09-17 05:41:16 +08:00
|
|
|
def S_CMP_LT_I32 : SOPC_CMP_32 <0x04, "s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">;
|
|
|
|
def S_CMP_LE_I32 : SOPC_CMP_32 <0x05, "s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">;
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_CMP_EQ_U32 : SOPC_CMP_32 <0x06, "s_cmp_eq_u32", COND_EQ>;
|
2016-09-17 05:41:16 +08:00
|
|
|
def S_CMP_LG_U32 : SOPC_CMP_32 <0x07, "s_cmp_lg_u32", COND_NE>;
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_CMP_GT_U32 : SOPC_CMP_32 <0x08, "s_cmp_gt_u32", COND_UGT>;
|
|
|
|
def S_CMP_GE_U32 : SOPC_CMP_32 <0x09, "s_cmp_ge_u32", COND_UGE>;
|
2016-09-17 05:41:16 +08:00
|
|
|
def S_CMP_LT_U32 : SOPC_CMP_32 <0x0a, "s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">;
|
|
|
|
def S_CMP_LE_U32 : SOPC_CMP_32 <0x0b, "s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">;
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
def S_BITCMP0_B32 : SOPC_32 <0x0c, "s_bitcmp0_b32">;
|
|
|
|
def S_BITCMP1_B32 : SOPC_32 <0x0d, "s_bitcmp1_b32">;
|
|
|
|
def S_BITCMP0_B64 : SOPC_64_32 <0x0e, "s_bitcmp0_b64">;
|
|
|
|
def S_BITCMP1_B64 : SOPC_64_32 <0x0f, "s_bitcmp1_b64">;
|
|
|
|
def S_SETVSKIP : SOPC_32 <0x10, "s_setvskip">;
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isVI in {
|
2016-09-17 10:02:19 +08:00
|
|
|
def S_CMP_EQ_U64 : SOPC_CMP_64 <0x12, "s_cmp_eq_u64", COND_EQ>;
|
|
|
|
def S_CMP_LG_U64 : SOPC_CMP_64 <0x13, "s_cmp_lg_u64", COND_NE>;
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
let SubtargetPredicate = HasVGPRIndexMode in {
|
|
|
|
def S_SET_GPR_IDX_ON : SOPC <0x11,
|
|
|
|
(outs),
|
|
|
|
(ins SSrc_b32:$src0, GPRIdxMode:$src1),
|
|
|
|
"s_set_gpr_idx_on $src0,$src1"> {
|
|
|
|
let Defs = [M0]; // No scc def
|
|
|
|
let Uses = [M0]; // Other bits of m0 unmodified.
|
|
|
|
let hasSideEffects = 1; // Sets mode.gpr_idx_en
|
2016-11-02 04:42:24 +08:00
|
|
|
let FixedSize = 1;
|
2016-10-13 02:00:51 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOPP Instructions
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class SOPPe <bits<7> op> : Enc32 {
|
|
|
|
bits <16> simm16;
|
|
|
|
|
|
|
|
let Inst{15-0} = simm16;
|
|
|
|
let Inst{22-16} = op;
|
|
|
|
let Inst{31-23} = 0x17f; // encoding
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOPP <bits<7> op, dag ins, string asm, list<dag> pattern = []> :
|
|
|
|
InstSI <(outs), ins, asm, pattern >, SOPPe <op> {
|
|
|
|
|
|
|
|
let mayLoad = 0;
|
|
|
|
let mayStore = 0;
|
|
|
|
let hasSideEffects = 0;
|
|
|
|
let SALU = 1;
|
|
|
|
let SOPP = 1;
|
2016-10-06 18:13:23 +08:00
|
|
|
let Size = 4;
|
2016-08-30 23:20:31 +08:00
|
|
|
let SchedRW = [WriteSALU];
|
|
|
|
|
|
|
|
let UseNamedOperandTable = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
def S_NOP : SOPP <0x00000000, (ins i16imm:$simm16), "s_nop $simm16">;
|
|
|
|
|
|
|
|
let isTerminator = 1 in {
|
|
|
|
|
[AMDGPU] Add support for immediate operand for S_ENDPGM
Summary:
Add support for immediate operand in S_ENDPGM
Change-Id: I0c56a076a10980f719fb2a8f16407e9c301013f6
Reviewers: alexshap
Subscribers: qcolombet, arsenm, kzhuravl, jvesely, wdng, nhaehnle, yaxunl, tpr, t-tye, eraman, arphaman, Petar.Avramovic, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59213
llvm-svn: 355902
2019-03-12 17:52:58 +08:00
|
|
|
def S_ENDPGM : SOPP <0x00000001, (ins EndpgmImm:$simm16), "s_endpgm $simm16"> {
|
2016-08-30 23:20:31 +08:00
|
|
|
let isBarrier = 1;
|
2016-10-29 07:00:38 +08:00
|
|
|
let isReturn = 1;
|
2016-08-30 23:20:31 +08:00
|
|
|
}
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isVI in {
|
2017-04-13 01:10:07 +08:00
|
|
|
def S_ENDPGM_SAVED : SOPP <0x0000001B, (ins), "s_endpgm_saved"> {
|
|
|
|
let simm16 = 0;
|
|
|
|
let isBarrier = 1;
|
|
|
|
let isReturn = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isGFX9 in {
|
2018-04-07 01:25:00 +08:00
|
|
|
let isBarrier = 1, isReturn = 1, simm16 = 0 in {
|
|
|
|
def S_ENDPGM_ORDERED_PS_DONE :
|
|
|
|
SOPP<0x01e, (ins), "s_endpgm_ordered_ps_done">;
|
|
|
|
} // End isBarrier = 1, isReturn = 1, simm16 = 0
|
2019-02-23 07:21:06 +08:00
|
|
|
} // End SubtargetPredicate = isGFX9
|
2018-04-07 01:25:00 +08:00
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
let isBranch = 1, SchedRW = [WriteBranch] in {
|
|
|
|
def S_BRANCH : SOPP <
|
|
|
|
0x00000002, (ins sopp_brtarget:$simm16), "s_branch $simm16",
|
|
|
|
[(br bb:$simm16)]> {
|
|
|
|
let isBarrier = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
let Uses = [SCC] in {
|
|
|
|
def S_CBRANCH_SCC0 : SOPP <
|
|
|
|
0x00000004, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_scc0 $simm16"
|
|
|
|
>;
|
|
|
|
def S_CBRANCH_SCC1 : SOPP <
|
|
|
|
0x00000005, (ins sopp_brtarget:$simm16),
|
2017-10-11 04:34:49 +08:00
|
|
|
"s_cbranch_scc1 $simm16"
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
} // End Uses = [SCC]
|
|
|
|
|
|
|
|
let Uses = [VCC] in {
|
|
|
|
def S_CBRANCH_VCCZ : SOPP <
|
|
|
|
0x00000006, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_vccz $simm16"
|
|
|
|
>;
|
|
|
|
def S_CBRANCH_VCCNZ : SOPP <
|
|
|
|
0x00000007, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_vccnz $simm16"
|
|
|
|
>;
|
|
|
|
} // End Uses = [VCC]
|
|
|
|
|
|
|
|
let Uses = [EXEC] in {
|
|
|
|
def S_CBRANCH_EXECZ : SOPP <
|
|
|
|
0x00000008, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_execz $simm16"
|
|
|
|
>;
|
|
|
|
def S_CBRANCH_EXECNZ : SOPP <
|
|
|
|
0x00000009, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_execnz $simm16"
|
|
|
|
>;
|
|
|
|
} // End Uses = [EXEC]
|
|
|
|
|
2017-04-06 01:26:45 +08:00
|
|
|
def S_CBRANCH_CDBGSYS : SOPP <
|
|
|
|
0x00000017, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_cdbgsys $simm16"
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_CBRANCH_CDBGSYS_AND_USER : SOPP <
|
|
|
|
0x0000001A, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_cdbgsys_and_user $simm16"
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_CBRANCH_CDBGSYS_OR_USER : SOPP <
|
|
|
|
0x00000019, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_cdbgsys_or_user $simm16"
|
|
|
|
>;
|
|
|
|
|
|
|
|
def S_CBRANCH_CDBGUSER : SOPP <
|
|
|
|
0x00000018, (ins sopp_brtarget:$simm16),
|
|
|
|
"s_cbranch_cdbguser $simm16"
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
} // End isBranch = 1
|
|
|
|
} // End isTerminator = 1
|
|
|
|
|
|
|
|
let hasSideEffects = 1 in {
|
|
|
|
def S_BARRIER : SOPP <0x0000000a, (ins), "s_barrier",
|
|
|
|
[(int_amdgcn_s_barrier)]> {
|
|
|
|
let SchedRW = [WriteBarrier];
|
|
|
|
let simm16 = 0;
|
|
|
|
let mayLoad = 1;
|
|
|
|
let mayStore = 1;
|
|
|
|
let isConvergent = 1;
|
|
|
|
}
|
|
|
|
|
2019-02-23 07:21:06 +08:00
|
|
|
let SubtargetPredicate = isVI in {
|
2017-04-13 01:10:07 +08:00
|
|
|
def S_WAKEUP : SOPP <0x00000003, (ins), "s_wakeup"> {
|
|
|
|
let simm16 = 0;
|
|
|
|
let mayLoad = 1;
|
|
|
|
let mayStore = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
let mayLoad = 1, mayStore = 1, hasSideEffects = 1 in
|
|
|
|
def S_WAITCNT : SOPP <0x0000000c, (ins WAIT_FLAG:$simm16), "s_waitcnt $simm16">;
|
|
|
|
def S_SETHALT : SOPP <0x0000000d, (ins i16imm:$simm16), "s_sethalt $simm16">;
|
2017-04-06 01:26:45 +08:00
|
|
|
def S_SETKILL : SOPP <0x0000000b, (ins i16imm:$simm16), "s_setkill $simm16">;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
// On SI the documentation says sleep for approximately 64 * low 2
|
|
|
|
// bits, consistent with the reported maximum of 448. On VI the
|
|
|
|
// maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the
|
|
|
|
// maximum really 15 on VI?
|
|
|
|
def S_SLEEP : SOPP <0x0000000e, (ins i32imm:$simm16),
|
|
|
|
"s_sleep $simm16", [(int_amdgcn_s_sleep SIMM16bit:$simm16)]> {
|
|
|
|
let hasSideEffects = 1;
|
|
|
|
let mayLoad = 1;
|
|
|
|
let mayStore = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
def S_SETPRIO : SOPP <0x0000000f, (ins i16imm:$simm16), "s_setprio $simm16">;
|
|
|
|
|
|
|
|
let Uses = [EXEC, M0] in {
|
|
|
|
// FIXME: Should this be mayLoad+mayStore?
|
|
|
|
def S_SENDMSG : SOPP <0x00000010, (ins SendMsgImm:$simm16), "s_sendmsg $simm16",
|
|
|
|
[(AMDGPUsendmsg (i32 imm:$simm16))]
|
|
|
|
>;
|
2017-01-05 02:06:55 +08:00
|
|
|
|
|
|
|
def S_SENDMSGHALT : SOPP <0x00000011, (ins SendMsgImm:$simm16), "s_sendmsghalt $simm16",
|
|
|
|
[(AMDGPUsendmsghalt (i32 imm:$simm16))]
|
|
|
|
>;
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End Uses = [EXEC, M0]
|
|
|
|
|
|
|
|
def S_TRAP : SOPP <0x00000012, (ins i16imm:$simm16), "s_trap $simm16">;
|
|
|
|
def S_ICACHE_INV : SOPP <0x00000013, (ins), "s_icache_inv"> {
|
|
|
|
let simm16 = 0;
|
|
|
|
}
|
|
|
|
def S_INCPERFLEVEL : SOPP <0x00000014, (ins i32imm:$simm16), "s_incperflevel $simm16",
|
|
|
|
[(int_amdgcn_s_incperflevel SIMM16bit:$simm16)]> {
|
|
|
|
let hasSideEffects = 1;
|
|
|
|
let mayLoad = 1;
|
|
|
|
let mayStore = 1;
|
|
|
|
}
|
|
|
|
def S_DECPERFLEVEL : SOPP <0x00000015, (ins i32imm:$simm16), "s_decperflevel $simm16",
|
|
|
|
[(int_amdgcn_s_decperflevel SIMM16bit:$simm16)]> {
|
|
|
|
let hasSideEffects = 1;
|
|
|
|
let mayLoad = 1;
|
|
|
|
let mayStore = 1;
|
|
|
|
}
|
|
|
|
def S_TTRACEDATA : SOPP <0x00000016, (ins), "s_ttracedata"> {
|
|
|
|
let simm16 = 0;
|
|
|
|
}
|
2016-10-13 02:00:51 +08:00
|
|
|
|
|
|
|
let SubtargetPredicate = HasVGPRIndexMode in {
|
|
|
|
def S_SET_GPR_IDX_OFF : SOPP<0x1c, (ins), "s_set_gpr_idx_off"> {
|
|
|
|
let simm16 = 0;
|
|
|
|
}
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
} // End hasSideEffects
|
|
|
|
|
2016-10-13 02:00:51 +08:00
|
|
|
let SubtargetPredicate = HasVGPRIndexMode in {
|
|
|
|
def S_SET_GPR_IDX_MODE : SOPP<0x1d, (ins GPRIdxMode:$simm16),
|
|
|
|
"s_set_gpr_idx_mode$simm16"> {
|
|
|
|
let Defs = [M0];
|
|
|
|
}
|
|
|
|
}
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// S_GETREG_B32 Intrinsic Pattern.
|
|
|
|
//===----------------------------------------------------------------------===//
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-08-30 23:20:31 +08:00
|
|
|
(int_amdgcn_s_getreg imm:$simm16),
|
|
|
|
(S_GETREG_B32 (as_i16imm $simm16))
|
|
|
|
>;
|
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP1 Patterns
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
[AMDGPU] Add support for immediate operand for S_ENDPGM
Summary:
Add support for immediate operand in S_ENDPGM
Change-Id: I0c56a076a10980f719fb2a8f16407e9c301013f6
Reviewers: alexshap
Subscribers: qcolombet, arsenm, kzhuravl, jvesely, wdng, nhaehnle, yaxunl, tpr, t-tye, eraman, arphaman, Petar.Avramovic, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59213
llvm-svn: 355902
2019-03-12 17:52:58 +08:00
|
|
|
def : GCNPat <
|
|
|
|
(AMDGPUendpgm),
|
|
|
|
(S_ENDPGM (i16 0))
|
|
|
|
>;
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-08-30 23:20:31 +08:00
|
|
|
(i64 (ctpop i64:$src)),
|
|
|
|
(i64 (REG_SEQUENCE SReg_64,
|
|
|
|
(i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0,
|
2016-11-11 00:02:37 +08:00
|
|
|
(S_MOV_B32 (i32 0)), sub1))
|
2016-08-30 23:20:31 +08:00
|
|
|
>;
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-08-30 23:20:31 +08:00
|
|
|
(i32 (smax i32:$x, (i32 (ineg i32:$x)))),
|
|
|
|
(S_ABS_I32 $x)
|
|
|
|
>;
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-11-11 00:02:37 +08:00
|
|
|
(i16 imm:$imm),
|
|
|
|
(S_MOV_B32 imm:$imm)
|
|
|
|
>;
|
|
|
|
|
|
|
|
// Same as a 32-bit inreg
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat<
|
2016-11-11 00:02:37 +08:00
|
|
|
(i32 (sext i16:$src)),
|
|
|
|
(S_SEXT_I32_I16 $src)
|
|
|
|
>;
|
|
|
|
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP2 Patterns
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector
|
|
|
|
// case, the sgpr-copies pass will fix this to use the vector version.
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-08-30 23:20:31 +08:00
|
|
|
(i32 (addc i32:$src0, i32:$src1)),
|
|
|
|
(S_ADD_U32 $src0, $src1)
|
|
|
|
>;
|
|
|
|
|
2016-11-11 00:02:37 +08:00
|
|
|
// FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that
|
|
|
|
// REG_SEQUENCE patterns don't support instructions with multiple
|
|
|
|
// outputs.
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat<
|
2016-11-11 00:02:37 +08:00
|
|
|
(i64 (zext i16:$src)),
|
|
|
|
(REG_SEQUENCE SReg_64,
|
|
|
|
(i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0,
|
|
|
|
(S_MOV_B32 (i32 0)), sub1)
|
|
|
|
>;
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-11-11 00:02:37 +08:00
|
|
|
(i64 (sext i16:$src)),
|
|
|
|
(REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0,
|
|
|
|
(i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1)
|
|
|
|
>;
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat<
|
2016-11-11 00:02:37 +08:00
|
|
|
(i32 (zext i16:$src)),
|
|
|
|
(S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src)
|
|
|
|
>;
|
|
|
|
|
|
|
|
|
|
|
|
|
2016-08-30 23:20:31 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOPP Patterns
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2017-10-03 08:06:41 +08:00
|
|
|
def : GCNPat <
|
2016-08-30 23:20:31 +08:00
|
|
|
(int_amdgcn_s_waitcnt i32:$simm16),
|
|
|
|
(S_WAITCNT (as_i16imm $simm16))
|
|
|
|
>;
|
|
|
|
|
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Real target instructions, move this to the appropriate subtarget TD file
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
class Select_si<string opName> :
|
|
|
|
SIMCInstr<opName, SIEncodingFamily.SI> {
|
2019-02-23 07:21:06 +08:00
|
|
|
list<Predicate> AssemblerPredicates = [isSICI];
|
2016-08-30 23:20:31 +08:00
|
|
|
string DecoderNamespace = "SICI";
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOP1_Real_si<bits<8> op, SOP1_Pseudo ps> :
|
|
|
|
SOP1_Real<op, ps>,
|
|
|
|
Select_si<ps.Mnemonic>;
|
|
|
|
|
|
|
|
class SOP2_Real_si<bits<7> op, SOP2_Pseudo ps> :
|
|
|
|
SOP2_Real<op, ps>,
|
|
|
|
Select_si<ps.Mnemonic>;
|
|
|
|
|
|
|
|
class SOPK_Real_si<bits<5> op, SOPK_Pseudo ps> :
|
|
|
|
SOPK_Real32<op, ps>,
|
|
|
|
Select_si<ps.Mnemonic>;
|
|
|
|
|
|
|
|
def S_MOV_B32_si : SOP1_Real_si <0x03, S_MOV_B32>;
|
|
|
|
def S_MOV_B64_si : SOP1_Real_si <0x04, S_MOV_B64>;
|
|
|
|
def S_CMOV_B32_si : SOP1_Real_si <0x05, S_CMOV_B32>;
|
|
|
|
def S_CMOV_B64_si : SOP1_Real_si <0x06, S_CMOV_B64>;
|
|
|
|
def S_NOT_B32_si : SOP1_Real_si <0x07, S_NOT_B32>;
|
|
|
|
def S_NOT_B64_si : SOP1_Real_si <0x08, S_NOT_B64>;
|
|
|
|
def S_WQM_B32_si : SOP1_Real_si <0x09, S_WQM_B32>;
|
|
|
|
def S_WQM_B64_si : SOP1_Real_si <0x0a, S_WQM_B64>;
|
|
|
|
def S_BREV_B32_si : SOP1_Real_si <0x0b, S_BREV_B32>;
|
|
|
|
def S_BREV_B64_si : SOP1_Real_si <0x0c, S_BREV_B64>;
|
|
|
|
def S_BCNT0_I32_B32_si : SOP1_Real_si <0x0d, S_BCNT0_I32_B32>;
|
|
|
|
def S_BCNT0_I32_B64_si : SOP1_Real_si <0x0e, S_BCNT0_I32_B64>;
|
|
|
|
def S_BCNT1_I32_B32_si : SOP1_Real_si <0x0f, S_BCNT1_I32_B32>;
|
|
|
|
def S_BCNT1_I32_B64_si : SOP1_Real_si <0x10, S_BCNT1_I32_B64>;
|
|
|
|
def S_FF0_I32_B32_si : SOP1_Real_si <0x11, S_FF0_I32_B32>;
|
|
|
|
def S_FF0_I32_B64_si : SOP1_Real_si <0x12, S_FF0_I32_B64>;
|
|
|
|
def S_FF1_I32_B32_si : SOP1_Real_si <0x13, S_FF1_I32_B32>;
|
|
|
|
def S_FF1_I32_B64_si : SOP1_Real_si <0x14, S_FF1_I32_B64>;
|
|
|
|
def S_FLBIT_I32_B32_si : SOP1_Real_si <0x15, S_FLBIT_I32_B32>;
|
|
|
|
def S_FLBIT_I32_B64_si : SOP1_Real_si <0x16, S_FLBIT_I32_B64>;
|
|
|
|
def S_FLBIT_I32_si : SOP1_Real_si <0x17, S_FLBIT_I32>;
|
|
|
|
def S_FLBIT_I32_I64_si : SOP1_Real_si <0x18, S_FLBIT_I32_I64>;
|
|
|
|
def S_SEXT_I32_I8_si : SOP1_Real_si <0x19, S_SEXT_I32_I8>;
|
|
|
|
def S_SEXT_I32_I16_si : SOP1_Real_si <0x1a, S_SEXT_I32_I16>;
|
|
|
|
def S_BITSET0_B32_si : SOP1_Real_si <0x1b, S_BITSET0_B32>;
|
|
|
|
def S_BITSET0_B64_si : SOP1_Real_si <0x1c, S_BITSET0_B64>;
|
|
|
|
def S_BITSET1_B32_si : SOP1_Real_si <0x1d, S_BITSET1_B32>;
|
|
|
|
def S_BITSET1_B64_si : SOP1_Real_si <0x1e, S_BITSET1_B64>;
|
|
|
|
def S_GETPC_B64_si : SOP1_Real_si <0x1f, S_GETPC_B64>;
|
|
|
|
def S_SETPC_B64_si : SOP1_Real_si <0x20, S_SETPC_B64>;
|
|
|
|
def S_SWAPPC_B64_si : SOP1_Real_si <0x21, S_SWAPPC_B64>;
|
|
|
|
def S_RFE_B64_si : SOP1_Real_si <0x22, S_RFE_B64>;
|
|
|
|
def S_AND_SAVEEXEC_B64_si : SOP1_Real_si <0x24, S_AND_SAVEEXEC_B64>;
|
|
|
|
def S_OR_SAVEEXEC_B64_si : SOP1_Real_si <0x25, S_OR_SAVEEXEC_B64>;
|
|
|
|
def S_XOR_SAVEEXEC_B64_si : SOP1_Real_si <0x26, S_XOR_SAVEEXEC_B64>;
|
|
|
|
def S_ANDN2_SAVEEXEC_B64_si: SOP1_Real_si <0x27, S_ANDN2_SAVEEXEC_B64>;
|
|
|
|
def S_ORN2_SAVEEXEC_B64_si : SOP1_Real_si <0x28, S_ORN2_SAVEEXEC_B64>;
|
|
|
|
def S_NAND_SAVEEXEC_B64_si : SOP1_Real_si <0x29, S_NAND_SAVEEXEC_B64>;
|
|
|
|
def S_NOR_SAVEEXEC_B64_si : SOP1_Real_si <0x2a, S_NOR_SAVEEXEC_B64>;
|
|
|
|
def S_XNOR_SAVEEXEC_B64_si : SOP1_Real_si <0x2b, S_XNOR_SAVEEXEC_B64>;
|
|
|
|
def S_QUADMASK_B32_si : SOP1_Real_si <0x2c, S_QUADMASK_B32>;
|
|
|
|
def S_QUADMASK_B64_si : SOP1_Real_si <0x2d, S_QUADMASK_B64>;
|
|
|
|
def S_MOVRELS_B32_si : SOP1_Real_si <0x2e, S_MOVRELS_B32>;
|
|
|
|
def S_MOVRELS_B64_si : SOP1_Real_si <0x2f, S_MOVRELS_B64>;
|
|
|
|
def S_MOVRELD_B32_si : SOP1_Real_si <0x30, S_MOVRELD_B32>;
|
|
|
|
def S_MOVRELD_B64_si : SOP1_Real_si <0x31, S_MOVRELD_B64>;
|
|
|
|
def S_CBRANCH_JOIN_si : SOP1_Real_si <0x32, S_CBRANCH_JOIN>;
|
|
|
|
def S_MOV_REGRD_B32_si : SOP1_Real_si <0x33, S_MOV_REGRD_B32>;
|
|
|
|
def S_ABS_I32_si : SOP1_Real_si <0x34, S_ABS_I32>;
|
|
|
|
def S_MOV_FED_B32_si : SOP1_Real_si <0x35, S_MOV_FED_B32>;
|
|
|
|
|
|
|
|
def S_ADD_U32_si : SOP2_Real_si <0x00, S_ADD_U32>;
|
|
|
|
def S_ADD_I32_si : SOP2_Real_si <0x02, S_ADD_I32>;
|
|
|
|
def S_SUB_U32_si : SOP2_Real_si <0x01, S_SUB_U32>;
|
|
|
|
def S_SUB_I32_si : SOP2_Real_si <0x03, S_SUB_I32>;
|
|
|
|
def S_ADDC_U32_si : SOP2_Real_si <0x04, S_ADDC_U32>;
|
|
|
|
def S_SUBB_U32_si : SOP2_Real_si <0x05, S_SUBB_U32>;
|
|
|
|
def S_MIN_I32_si : SOP2_Real_si <0x06, S_MIN_I32>;
|
|
|
|
def S_MIN_U32_si : SOP2_Real_si <0x07, S_MIN_U32>;
|
|
|
|
def S_MAX_I32_si : SOP2_Real_si <0x08, S_MAX_I32>;
|
|
|
|
def S_MAX_U32_si : SOP2_Real_si <0x09, S_MAX_U32>;
|
|
|
|
def S_CSELECT_B32_si : SOP2_Real_si <0x0a, S_CSELECT_B32>;
|
|
|
|
def S_CSELECT_B64_si : SOP2_Real_si <0x0b, S_CSELECT_B64>;
|
|
|
|
def S_AND_B32_si : SOP2_Real_si <0x0e, S_AND_B32>;
|
|
|
|
def S_AND_B64_si : SOP2_Real_si <0x0f, S_AND_B64>;
|
|
|
|
def S_OR_B32_si : SOP2_Real_si <0x10, S_OR_B32>;
|
|
|
|
def S_OR_B64_si : SOP2_Real_si <0x11, S_OR_B64>;
|
|
|
|
def S_XOR_B32_si : SOP2_Real_si <0x12, S_XOR_B32>;
|
|
|
|
def S_XOR_B64_si : SOP2_Real_si <0x13, S_XOR_B64>;
|
|
|
|
def S_ANDN2_B32_si : SOP2_Real_si <0x14, S_ANDN2_B32>;
|
|
|
|
def S_ANDN2_B64_si : SOP2_Real_si <0x15, S_ANDN2_B64>;
|
|
|
|
def S_ORN2_B32_si : SOP2_Real_si <0x16, S_ORN2_B32>;
|
|
|
|
def S_ORN2_B64_si : SOP2_Real_si <0x17, S_ORN2_B64>;
|
|
|
|
def S_NAND_B32_si : SOP2_Real_si <0x18, S_NAND_B32>;
|
|
|
|
def S_NAND_B64_si : SOP2_Real_si <0x19, S_NAND_B64>;
|
|
|
|
def S_NOR_B32_si : SOP2_Real_si <0x1a, S_NOR_B32>;
|
|
|
|
def S_NOR_B64_si : SOP2_Real_si <0x1b, S_NOR_B64>;
|
|
|
|
def S_XNOR_B32_si : SOP2_Real_si <0x1c, S_XNOR_B32>;
|
|
|
|
def S_XNOR_B64_si : SOP2_Real_si <0x1d, S_XNOR_B64>;
|
|
|
|
def S_LSHL_B32_si : SOP2_Real_si <0x1e, S_LSHL_B32>;
|
|
|
|
def S_LSHL_B64_si : SOP2_Real_si <0x1f, S_LSHL_B64>;
|
|
|
|
def S_LSHR_B32_si : SOP2_Real_si <0x20, S_LSHR_B32>;
|
|
|
|
def S_LSHR_B64_si : SOP2_Real_si <0x21, S_LSHR_B64>;
|
|
|
|
def S_ASHR_I32_si : SOP2_Real_si <0x22, S_ASHR_I32>;
|
|
|
|
def S_ASHR_I64_si : SOP2_Real_si <0x23, S_ASHR_I64>;
|
|
|
|
def S_BFM_B32_si : SOP2_Real_si <0x24, S_BFM_B32>;
|
|
|
|
def S_BFM_B64_si : SOP2_Real_si <0x25, S_BFM_B64>;
|
|
|
|
def S_MUL_I32_si : SOP2_Real_si <0x26, S_MUL_I32>;
|
|
|
|
def S_BFE_U32_si : SOP2_Real_si <0x27, S_BFE_U32>;
|
|
|
|
def S_BFE_I32_si : SOP2_Real_si <0x28, S_BFE_I32>;
|
|
|
|
def S_BFE_U64_si : SOP2_Real_si <0x29, S_BFE_U64>;
|
|
|
|
def S_BFE_I64_si : SOP2_Real_si <0x2a, S_BFE_I64>;
|
|
|
|
def S_CBRANCH_G_FORK_si : SOP2_Real_si <0x2b, S_CBRANCH_G_FORK>;
|
|
|
|
def S_ABSDIFF_I32_si : SOP2_Real_si <0x2c, S_ABSDIFF_I32>;
|
|
|
|
|
|
|
|
def S_MOVK_I32_si : SOPK_Real_si <0x00, S_MOVK_I32>;
|
|
|
|
def S_CMOVK_I32_si : SOPK_Real_si <0x02, S_CMOVK_I32>;
|
|
|
|
def S_CMPK_EQ_I32_si : SOPK_Real_si <0x03, S_CMPK_EQ_I32>;
|
|
|
|
def S_CMPK_LG_I32_si : SOPK_Real_si <0x04, S_CMPK_LG_I32>;
|
|
|
|
def S_CMPK_GT_I32_si : SOPK_Real_si <0x05, S_CMPK_GT_I32>;
|
|
|
|
def S_CMPK_GE_I32_si : SOPK_Real_si <0x06, S_CMPK_GE_I32>;
|
|
|
|
def S_CMPK_LT_I32_si : SOPK_Real_si <0x07, S_CMPK_LT_I32>;
|
|
|
|
def S_CMPK_LE_I32_si : SOPK_Real_si <0x08, S_CMPK_LE_I32>;
|
|
|
|
def S_CMPK_EQ_U32_si : SOPK_Real_si <0x09, S_CMPK_EQ_U32>;
|
|
|
|
def S_CMPK_LG_U32_si : SOPK_Real_si <0x0a, S_CMPK_LG_U32>;
|
|
|
|
def S_CMPK_GT_U32_si : SOPK_Real_si <0x0b, S_CMPK_GT_U32>;
|
|
|
|
def S_CMPK_GE_U32_si : SOPK_Real_si <0x0c, S_CMPK_GE_U32>;
|
|
|
|
def S_CMPK_LT_U32_si : SOPK_Real_si <0x0d, S_CMPK_LT_U32>;
|
|
|
|
def S_CMPK_LE_U32_si : SOPK_Real_si <0x0e, S_CMPK_LE_U32>;
|
|
|
|
def S_ADDK_I32_si : SOPK_Real_si <0x0f, S_ADDK_I32>;
|
|
|
|
def S_MULK_I32_si : SOPK_Real_si <0x10, S_MULK_I32>;
|
|
|
|
def S_CBRANCH_I_FORK_si : SOPK_Real_si <0x11, S_CBRANCH_I_FORK>;
|
|
|
|
def S_GETREG_B32_si : SOPK_Real_si <0x12, S_GETREG_B32>;
|
|
|
|
def S_SETREG_B32_si : SOPK_Real_si <0x13, S_SETREG_B32>;
|
|
|
|
//def S_GETREG_REGRD_B32_si : SOPK_Real_si <0x14, S_GETREG_REGRD_B32>; // see pseudo for comments
|
|
|
|
def S_SETREG_IMM32_B32_si : SOPK_Real64<0x15, S_SETREG_IMM32_B32>,
|
|
|
|
Select_si<S_SETREG_IMM32_B32.Mnemonic>;
|
|
|
|
|
|
|
|
|
|
|
|
class Select_vi<string opName> :
|
|
|
|
SIMCInstr<opName, SIEncodingFamily.VI> {
|
2019-02-23 07:21:06 +08:00
|
|
|
list<Predicate> AssemblerPredicates = [isVI];
|
2016-08-30 23:20:31 +08:00
|
|
|
string DecoderNamespace = "VI";
|
|
|
|
}
|
|
|
|
|
|
|
|
class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> :
|
|
|
|
SOP1_Real<op, ps>,
|
|
|
|
Select_vi<ps.Mnemonic>;
|
|
|
|
|
|
|
|
|
|
|
|
class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> :
|
|
|
|
SOP2_Real<op, ps>,
|
|
|
|
Select_vi<ps.Mnemonic>;
|
|
|
|
|
|
|
|
class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> :
|
|
|
|
SOPK_Real32<op, ps>,
|
|
|
|
Select_vi<ps.Mnemonic>;
|
|
|
|
|
|
|
|
def S_MOV_B32_vi : SOP1_Real_vi <0x00, S_MOV_B32>;
|
|
|
|
def S_MOV_B64_vi : SOP1_Real_vi <0x01, S_MOV_B64>;
|
|
|
|
def S_CMOV_B32_vi : SOP1_Real_vi <0x02, S_CMOV_B32>;
|
|
|
|
def S_CMOV_B64_vi : SOP1_Real_vi <0x03, S_CMOV_B64>;
|
|
|
|
def S_NOT_B32_vi : SOP1_Real_vi <0x04, S_NOT_B32>;
|
|
|
|
def S_NOT_B64_vi : SOP1_Real_vi <0x05, S_NOT_B64>;
|
|
|
|
def S_WQM_B32_vi : SOP1_Real_vi <0x06, S_WQM_B32>;
|
|
|
|
def S_WQM_B64_vi : SOP1_Real_vi <0x07, S_WQM_B64>;
|
|
|
|
def S_BREV_B32_vi : SOP1_Real_vi <0x08, S_BREV_B32>;
|
|
|
|
def S_BREV_B64_vi : SOP1_Real_vi <0x09, S_BREV_B64>;
|
|
|
|
def S_BCNT0_I32_B32_vi : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>;
|
|
|
|
def S_BCNT0_I32_B64_vi : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>;
|
|
|
|
def S_BCNT1_I32_B32_vi : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>;
|
|
|
|
def S_BCNT1_I32_B64_vi : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>;
|
|
|
|
def S_FF0_I32_B32_vi : SOP1_Real_vi <0x0e, S_FF0_I32_B32>;
|
|
|
|
def S_FF0_I32_B64_vi : SOP1_Real_vi <0x0f, S_FF0_I32_B64>;
|
|
|
|
def S_FF1_I32_B32_vi : SOP1_Real_vi <0x10, S_FF1_I32_B32>;
|
|
|
|
def S_FF1_I32_B64_vi : SOP1_Real_vi <0x11, S_FF1_I32_B64>;
|
|
|
|
def S_FLBIT_I32_B32_vi : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>;
|
|
|
|
def S_FLBIT_I32_B64_vi : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>;
|
|
|
|
def S_FLBIT_I32_vi : SOP1_Real_vi <0x14, S_FLBIT_I32>;
|
|
|
|
def S_FLBIT_I32_I64_vi : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>;
|
|
|
|
def S_SEXT_I32_I8_vi : SOP1_Real_vi <0x16, S_SEXT_I32_I8>;
|
|
|
|
def S_SEXT_I32_I16_vi : SOP1_Real_vi <0x17, S_SEXT_I32_I16>;
|
|
|
|
def S_BITSET0_B32_vi : SOP1_Real_vi <0x18, S_BITSET0_B32>;
|
|
|
|
def S_BITSET0_B64_vi : SOP1_Real_vi <0x19, S_BITSET0_B64>;
|
|
|
|
def S_BITSET1_B32_vi : SOP1_Real_vi <0x1a, S_BITSET1_B32>;
|
|
|
|
def S_BITSET1_B64_vi : SOP1_Real_vi <0x1b, S_BITSET1_B64>;
|
|
|
|
def S_GETPC_B64_vi : SOP1_Real_vi <0x1c, S_GETPC_B64>;
|
|
|
|
def S_SETPC_B64_vi : SOP1_Real_vi <0x1d, S_SETPC_B64>;
|
|
|
|
def S_SWAPPC_B64_vi : SOP1_Real_vi <0x1e, S_SWAPPC_B64>;
|
|
|
|
def S_RFE_B64_vi : SOP1_Real_vi <0x1f, S_RFE_B64>;
|
|
|
|
def S_AND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>;
|
|
|
|
def S_OR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>;
|
|
|
|
def S_XOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>;
|
|
|
|
def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>;
|
|
|
|
def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>;
|
|
|
|
def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>;
|
|
|
|
def S_NOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>;
|
|
|
|
def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>;
|
|
|
|
def S_QUADMASK_B32_vi : SOP1_Real_vi <0x28, S_QUADMASK_B32>;
|
|
|
|
def S_QUADMASK_B64_vi : SOP1_Real_vi <0x29, S_QUADMASK_B64>;
|
|
|
|
def S_MOVRELS_B32_vi : SOP1_Real_vi <0x2a, S_MOVRELS_B32>;
|
|
|
|
def S_MOVRELS_B64_vi : SOP1_Real_vi <0x2b, S_MOVRELS_B64>;
|
|
|
|
def S_MOVRELD_B32_vi : SOP1_Real_vi <0x2c, S_MOVRELD_B32>;
|
|
|
|
def S_MOVRELD_B64_vi : SOP1_Real_vi <0x2d, S_MOVRELD_B64>;
|
|
|
|
def S_CBRANCH_JOIN_vi : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>;
|
|
|
|
def S_MOV_REGRD_B32_vi : SOP1_Real_vi <0x2f, S_MOV_REGRD_B32>;
|
|
|
|
def S_ABS_I32_vi : SOP1_Real_vi <0x30, S_ABS_I32>;
|
|
|
|
def S_MOV_FED_B32_vi : SOP1_Real_vi <0x31, S_MOV_FED_B32>;
|
2016-10-13 02:00:51 +08:00
|
|
|
def S_SET_GPR_IDX_IDX_vi : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
def S_ADD_U32_vi : SOP2_Real_vi <0x00, S_ADD_U32>;
|
|
|
|
def S_ADD_I32_vi : SOP2_Real_vi <0x02, S_ADD_I32>;
|
|
|
|
def S_SUB_U32_vi : SOP2_Real_vi <0x01, S_SUB_U32>;
|
|
|
|
def S_SUB_I32_vi : SOP2_Real_vi <0x03, S_SUB_I32>;
|
|
|
|
def S_ADDC_U32_vi : SOP2_Real_vi <0x04, S_ADDC_U32>;
|
|
|
|
def S_SUBB_U32_vi : SOP2_Real_vi <0x05, S_SUBB_U32>;
|
|
|
|
def S_MIN_I32_vi : SOP2_Real_vi <0x06, S_MIN_I32>;
|
|
|
|
def S_MIN_U32_vi : SOP2_Real_vi <0x07, S_MIN_U32>;
|
|
|
|
def S_MAX_I32_vi : SOP2_Real_vi <0x08, S_MAX_I32>;
|
|
|
|
def S_MAX_U32_vi : SOP2_Real_vi <0x09, S_MAX_U32>;
|
|
|
|
def S_CSELECT_B32_vi : SOP2_Real_vi <0x0a, S_CSELECT_B32>;
|
|
|
|
def S_CSELECT_B64_vi : SOP2_Real_vi <0x0b, S_CSELECT_B64>;
|
|
|
|
def S_AND_B32_vi : SOP2_Real_vi <0x0c, S_AND_B32>;
|
|
|
|
def S_AND_B64_vi : SOP2_Real_vi <0x0d, S_AND_B64>;
|
|
|
|
def S_OR_B32_vi : SOP2_Real_vi <0x0e, S_OR_B32>;
|
|
|
|
def S_OR_B64_vi : SOP2_Real_vi <0x0f, S_OR_B64>;
|
|
|
|
def S_XOR_B32_vi : SOP2_Real_vi <0x10, S_XOR_B32>;
|
|
|
|
def S_XOR_B64_vi : SOP2_Real_vi <0x11, S_XOR_B64>;
|
|
|
|
def S_ANDN2_B32_vi : SOP2_Real_vi <0x12, S_ANDN2_B32>;
|
|
|
|
def S_ANDN2_B64_vi : SOP2_Real_vi <0x13, S_ANDN2_B64>;
|
|
|
|
def S_ORN2_B32_vi : SOP2_Real_vi <0x14, S_ORN2_B32>;
|
|
|
|
def S_ORN2_B64_vi : SOP2_Real_vi <0x15, S_ORN2_B64>;
|
|
|
|
def S_NAND_B32_vi : SOP2_Real_vi <0x16, S_NAND_B32>;
|
|
|
|
def S_NAND_B64_vi : SOP2_Real_vi <0x17, S_NAND_B64>;
|
|
|
|
def S_NOR_B32_vi : SOP2_Real_vi <0x18, S_NOR_B32>;
|
|
|
|
def S_NOR_B64_vi : SOP2_Real_vi <0x19, S_NOR_B64>;
|
|
|
|
def S_XNOR_B32_vi : SOP2_Real_vi <0x1a, S_XNOR_B32>;
|
|
|
|
def S_XNOR_B64_vi : SOP2_Real_vi <0x1b, S_XNOR_B64>;
|
|
|
|
def S_LSHL_B32_vi : SOP2_Real_vi <0x1c, S_LSHL_B32>;
|
|
|
|
def S_LSHL_B64_vi : SOP2_Real_vi <0x1d, S_LSHL_B64>;
|
|
|
|
def S_LSHR_B32_vi : SOP2_Real_vi <0x1e, S_LSHR_B32>;
|
|
|
|
def S_LSHR_B64_vi : SOP2_Real_vi <0x1f, S_LSHR_B64>;
|
|
|
|
def S_ASHR_I32_vi : SOP2_Real_vi <0x20, S_ASHR_I32>;
|
|
|
|
def S_ASHR_I64_vi : SOP2_Real_vi <0x21, S_ASHR_I64>;
|
|
|
|
def S_BFM_B32_vi : SOP2_Real_vi <0x22, S_BFM_B32>;
|
|
|
|
def S_BFM_B64_vi : SOP2_Real_vi <0x23, S_BFM_B64>;
|
|
|
|
def S_MUL_I32_vi : SOP2_Real_vi <0x24, S_MUL_I32>;
|
|
|
|
def S_BFE_U32_vi : SOP2_Real_vi <0x25, S_BFE_U32>;
|
|
|
|
def S_BFE_I32_vi : SOP2_Real_vi <0x26, S_BFE_I32>;
|
|
|
|
def S_BFE_U64_vi : SOP2_Real_vi <0x27, S_BFE_U64>;
|
|
|
|
def S_BFE_I64_vi : SOP2_Real_vi <0x28, S_BFE_I64>;
|
|
|
|
def S_CBRANCH_G_FORK_vi : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>;
|
|
|
|
def S_ABSDIFF_I32_vi : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>;
|
2017-02-28 02:49:11 +08:00
|
|
|
def S_PACK_LL_B32_B16_vi : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>;
|
|
|
|
def S_PACK_LH_B32_B16_vi : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>;
|
|
|
|
def S_PACK_HH_B32_B16_vi : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>;
|
2017-04-13 01:10:07 +08:00
|
|
|
def S_RFE_RESTORE_B64_vi : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>;
|
2016-08-30 23:20:31 +08:00
|
|
|
|
|
|
|
def S_MOVK_I32_vi : SOPK_Real_vi <0x00, S_MOVK_I32>;
|
|
|
|
def S_CMOVK_I32_vi : SOPK_Real_vi <0x01, S_CMOVK_I32>;
|
|
|
|
def S_CMPK_EQ_I32_vi : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>;
|
|
|
|
def S_CMPK_LG_I32_vi : SOPK_Real_vi <0x03, S_CMPK_LG_I32>;
|
|
|
|
def S_CMPK_GT_I32_vi : SOPK_Real_vi <0x04, S_CMPK_GT_I32>;
|
|
|
|
def S_CMPK_GE_I32_vi : SOPK_Real_vi <0x05, S_CMPK_GE_I32>;
|
|
|
|
def S_CMPK_LT_I32_vi : SOPK_Real_vi <0x06, S_CMPK_LT_I32>;
|
|
|
|
def S_CMPK_LE_I32_vi : SOPK_Real_vi <0x07, S_CMPK_LE_I32>;
|
|
|
|
def S_CMPK_EQ_U32_vi : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>;
|
|
|
|
def S_CMPK_LG_U32_vi : SOPK_Real_vi <0x09, S_CMPK_LG_U32>;
|
|
|
|
def S_CMPK_GT_U32_vi : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>;
|
|
|
|
def S_CMPK_GE_U32_vi : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>;
|
|
|
|
def S_CMPK_LT_U32_vi : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>;
|
|
|
|
def S_CMPK_LE_U32_vi : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>;
|
|
|
|
def S_ADDK_I32_vi : SOPK_Real_vi <0x0E, S_ADDK_I32>;
|
|
|
|
def S_MULK_I32_vi : SOPK_Real_vi <0x0F, S_MULK_I32>;
|
|
|
|
def S_CBRANCH_I_FORK_vi : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>;
|
|
|
|
def S_GETREG_B32_vi : SOPK_Real_vi <0x11, S_GETREG_B32>;
|
|
|
|
def S_SETREG_B32_vi : SOPK_Real_vi <0x12, S_SETREG_B32>;
|
|
|
|
//def S_GETREG_REGRD_B32_vi : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments
|
|
|
|
def S_SETREG_IMM32_B32_vi : SOPK_Real64<0x14, S_SETREG_IMM32_B32>,
|
2016-09-07 04:00:26 +08:00
|
|
|
Select_vi<S_SETREG_IMM32_B32.Mnemonic>;
|
2018-04-07 00:35:11 +08:00
|
|
|
|
2018-04-07 02:24:49 +08:00
|
|
|
def S_CALL_B64_vi : SOPK_Real_vi <0x15, S_CALL_B64>;
|
|
|
|
|
2018-04-07 00:35:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP1 - GFX9.
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
def S_ANDN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>;
|
|
|
|
def S_ORN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>;
|
|
|
|
def S_ANDN1_WREXEC_B64_vi : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>;
|
|
|
|
def S_ANDN2_WREXEC_B64_vi : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>;
|
|
|
|
def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>;
|
2018-04-09 21:10:33 +08:00
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SOP2 - GFX9.
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
def S_LSHL1_ADD_U32_vi : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>;
|
|
|
|
def S_LSHL2_ADD_U32_vi : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>;
|
|
|
|
def S_LSHL3_ADD_U32_vi : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>;
|
|
|
|
def S_LSHL4_ADD_U32_vi : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>;
|
|
|
|
def S_MUL_HI_U32_vi : SOP2_Real_vi<0x2c, S_MUL_HI_U32>;
|
|
|
|
def S_MUL_HI_I32_vi : SOP2_Real_vi<0x2d, S_MUL_HI_I32>;
|