mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-11-05 13:09:10 +00:00
692ee102eb
* Added R600_Reg64 class * Added T#Index#.XY registers definition * Added v2i32 register reads from parameter and global space * Added f32 and i32 elements extraction from v2f32 and v2i32 * Added v2i32 -> v2f32 conversions Tom Stellard: - Mark vec2 operations as expand. The addition of a vec2 register class made them all legal. Patch by: Dmitry Cherkassov Signed-off-by: Dmitry Cherkassov <dcherkassov@gmail.com> git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@187582 91177308-0d34-0410-b5e6-96231b3b80d8
234 lines
9.0 KiB
TableGen
234 lines
9.0 KiB
TableGen
|
|
class R600Reg <string name, bits<16> encoding> : Register<name> {
|
|
let Namespace = "AMDGPU";
|
|
let HWEncoding = encoding;
|
|
}
|
|
|
|
class R600RegWithChan <string name, bits<9> sel, string chan> :
|
|
Register <name> {
|
|
|
|
field bits<2> chan_encoding = !if(!eq(chan, "X"), 0,
|
|
!if(!eq(chan, "Y"), 1,
|
|
!if(!eq(chan, "Z"), 2,
|
|
!if(!eq(chan, "W"), 3, 0))));
|
|
let HWEncoding{8-0} = sel;
|
|
let HWEncoding{10-9} = chan_encoding;
|
|
let Namespace = "AMDGPU";
|
|
}
|
|
|
|
class R600Reg_128<string n, list<Register> subregs, bits<16> encoding> :
|
|
RegisterWithSubRegs<n, subregs> {
|
|
let Namespace = "AMDGPU";
|
|
let SubRegIndices = [sub0, sub1, sub2, sub3];
|
|
let HWEncoding = encoding;
|
|
}
|
|
|
|
class R600Reg_64<string n, list<Register> subregs, bits<16> encoding> :
|
|
RegisterWithSubRegs<n, subregs> {
|
|
let Namespace = "AMDGPU";
|
|
let SubRegIndices = [sub0, sub1];
|
|
let HWEncoding = encoding;
|
|
}
|
|
|
|
|
|
foreach Index = 0-127 in {
|
|
foreach Chan = [ "X", "Y", "Z", "W" ] in {
|
|
// 32-bit Temporary Registers
|
|
def T#Index#_#Chan : R600RegWithChan <"T"#Index#"."#Chan, Index, Chan>;
|
|
|
|
// Indirect addressing offset registers
|
|
def Addr#Index#_#Chan : R600RegWithChan <"T("#Index#" + AR.x)."#Chan,
|
|
Index, Chan>;
|
|
def TRegMem#Index#_#Chan : R600RegWithChan <"T"#Index#"."#Chan, Index,
|
|
Chan>;
|
|
}
|
|
// 128-bit Temporary Registers
|
|
def T#Index#_XYZW : R600Reg_128 <"T"#Index#"",
|
|
[!cast<Register>("T"#Index#"_X"),
|
|
!cast<Register>("T"#Index#"_Y"),
|
|
!cast<Register>("T"#Index#"_Z"),
|
|
!cast<Register>("T"#Index#"_W")],
|
|
Index>;
|
|
|
|
def T#Index#_XY : R600Reg_64 <"T"#Index#"",
|
|
[!cast<Register>("T"#Index#"_X"),
|
|
!cast<Register>("T"#Index#"_Y")],
|
|
Index>;
|
|
}
|
|
|
|
// KCACHE_BANK0
|
|
foreach Index = 159-128 in {
|
|
foreach Chan = [ "X", "Y", "Z", "W" ] in {
|
|
// 32-bit Temporary Registers
|
|
def KC0_#Index#_#Chan : R600RegWithChan <"KC0["#!add(Index,-128)#"]."#Chan, Index, Chan>;
|
|
}
|
|
// 128-bit Temporary Registers
|
|
def KC0_#Index#_XYZW : R600Reg_128 <"KC0["#!add(Index, -128)#"].XYZW",
|
|
[!cast<Register>("KC0_"#Index#"_X"),
|
|
!cast<Register>("KC0_"#Index#"_Y"),
|
|
!cast<Register>("KC0_"#Index#"_Z"),
|
|
!cast<Register>("KC0_"#Index#"_W")],
|
|
Index>;
|
|
}
|
|
|
|
// KCACHE_BANK1
|
|
foreach Index = 191-160 in {
|
|
foreach Chan = [ "X", "Y", "Z", "W" ] in {
|
|
// 32-bit Temporary Registers
|
|
def KC1_#Index#_#Chan : R600RegWithChan <"KC1["#!add(Index,-160)#"]."#Chan, Index, Chan>;
|
|
}
|
|
// 128-bit Temporary Registers
|
|
def KC1_#Index#_XYZW : R600Reg_128 <"KC1["#!add(Index, -160)#"].XYZW",
|
|
[!cast<Register>("KC1_"#Index#"_X"),
|
|
!cast<Register>("KC1_"#Index#"_Y"),
|
|
!cast<Register>("KC1_"#Index#"_Z"),
|
|
!cast<Register>("KC1_"#Index#"_W")],
|
|
Index>;
|
|
}
|
|
|
|
|
|
// Array Base Register holding input in FS
|
|
foreach Index = 448-480 in {
|
|
def ArrayBase#Index : R600Reg<"ARRAY_BASE", Index>;
|
|
}
|
|
|
|
|
|
// Special Registers
|
|
|
|
def ZERO : R600Reg<"0.0", 248>;
|
|
def ONE : R600Reg<"1.0", 249>;
|
|
def NEG_ONE : R600Reg<"-1.0", 249>;
|
|
def ONE_INT : R600Reg<"1", 250>;
|
|
def HALF : R600Reg<"0.5", 252>;
|
|
def NEG_HALF : R600Reg<"-0.5", 252>;
|
|
def ALU_LITERAL_X : R600RegWithChan<"literal.x", 253, "X">;
|
|
def ALU_LITERAL_Y : R600RegWithChan<"literal.y", 253, "Y">;
|
|
def ALU_LITERAL_Z : R600RegWithChan<"literal.z", 253, "Z">;
|
|
def ALU_LITERAL_W : R600RegWithChan<"literal.w", 253, "W">;
|
|
def PV_X : R600RegWithChan<"PV.X", 254, "X">;
|
|
def PV_Y : R600RegWithChan<"PV.Y", 254, "Y">;
|
|
def PV_Z : R600RegWithChan<"PV.Z", 254, "Z">;
|
|
def PV_W : R600RegWithChan<"PV.W", 254, "W">;
|
|
def PS: R600Reg<"PS", 255>;
|
|
def PREDICATE_BIT : R600Reg<"PredicateBit", 0>;
|
|
def PRED_SEL_OFF: R600Reg<"Pred_sel_off", 0>;
|
|
def PRED_SEL_ZERO : R600Reg<"Pred_sel_zero", 2>;
|
|
def PRED_SEL_ONE : R600Reg<"Pred_sel_one", 3>;
|
|
def AR_X : R600Reg<"AR.x", 0>;
|
|
def OQAP : R600Reg<"OQAP", 221>;
|
|
|
|
def R600_ArrayBase : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "ArrayBase%u", 448, 480))>;
|
|
// special registers for ALU src operands
|
|
// const buffer reference, SRCx_SEL contains index
|
|
def ALU_CONST : R600Reg<"CBuf", 0>;
|
|
// interpolation param reference, SRCx_SEL contains index
|
|
def ALU_PARAM : R600Reg<"Param", 0>;
|
|
|
|
let isAllocatable = 0 in {
|
|
|
|
// XXX: Only use the X channel, until we support wider stack widths
|
|
def R600_Addr : RegisterClass <"AMDGPU", [i32], 127, (add (sequence "Addr%u_X", 0, 127))>;
|
|
|
|
} // End isAllocatable = 0
|
|
|
|
def R600_KC0_X : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC0_%u_X", 128, 159))>;
|
|
|
|
def R600_KC0_Y : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC0_%u_Y", 128, 159))>;
|
|
|
|
def R600_KC0_Z : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC0_%u_Z", 128, 159))>;
|
|
|
|
def R600_KC0_W : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC0_%u_W", 128, 159))>;
|
|
|
|
def R600_KC0 : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(interleave R600_KC0_X, R600_KC0_Y,
|
|
R600_KC0_Z, R600_KC0_W)>;
|
|
|
|
def R600_KC1_X : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC1_%u_X", 160, 191))>;
|
|
|
|
def R600_KC1_Y : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC1_%u_Y", 160, 191))>;
|
|
|
|
def R600_KC1_Z : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC1_%u_Z", 160, 191))>;
|
|
|
|
def R600_KC1_W : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "KC1_%u_W", 160, 191))>;
|
|
|
|
def R600_KC1 : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(interleave R600_KC1_X, R600_KC1_Y,
|
|
R600_KC1_Z, R600_KC1_W)>;
|
|
|
|
def R600_TReg32_X : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "T%u_X", 0, 127), AR_X)>;
|
|
|
|
def R600_TReg32_Y : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "T%u_Y", 0, 127))>;
|
|
|
|
def R600_TReg32_Z : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "T%u_Z", 0, 127))>;
|
|
|
|
def R600_TReg32_W : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "T%u_W", 0, 127))>;
|
|
|
|
def R600_TReg32 : RegisterClass <"AMDGPU", [f32, i32], 32,
|
|
(interleave R600_TReg32_X, R600_TReg32_Y,
|
|
R600_TReg32_Z, R600_TReg32_W)>;
|
|
|
|
def R600_Reg32 : RegisterClass <"AMDGPU", [f32, i32], 32, (add
|
|
R600_TReg32,
|
|
R600_ArrayBase,
|
|
R600_Addr,
|
|
ZERO, HALF, ONE, ONE_INT, PV_X, ALU_LITERAL_X, NEG_ONE, NEG_HALF,
|
|
ALU_CONST, ALU_PARAM, OQAP
|
|
)>;
|
|
|
|
def R600_Predicate : RegisterClass <"AMDGPU", [i32], 32, (add
|
|
PRED_SEL_OFF, PRED_SEL_ZERO, PRED_SEL_ONE)>;
|
|
|
|
def R600_Predicate_Bit: RegisterClass <"AMDGPU", [i32], 32, (add
|
|
PREDICATE_BIT)>;
|
|
|
|
def R600_Reg128 : RegisterClass<"AMDGPU", [v4f32, v4i32], 128,
|
|
(add (sequence "T%u_XYZW", 0, 127))> {
|
|
let CopyCost = -1;
|
|
}
|
|
|
|
def R600_Reg64 : RegisterClass<"AMDGPU", [v2f32, v2i32], 64,
|
|
(add (sequence "T%u_XY", 0, 63))>;
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Register classes for indirect addressing
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Super register for all the Indirect Registers. This register class is used
|
|
// by the REG_SEQUENCE instruction to specify the registers to use for direct
|
|
// reads / writes which may be written / read by an indirect address.
|
|
class IndirectSuper<string n, list<Register> subregs> :
|
|
RegisterWithSubRegs<n, subregs> {
|
|
let Namespace = "AMDGPU";
|
|
let SubRegIndices =
|
|
[sub0, sub1, sub2, sub3, sub4, sub5, sub6, sub7,
|
|
sub8, sub9, sub10, sub11, sub12, sub13, sub14, sub15];
|
|
}
|
|
|
|
def IndirectSuperReg : IndirectSuper<"Indirect",
|
|
[TRegMem0_X, TRegMem1_X, TRegMem2_X, TRegMem3_X, TRegMem4_X, TRegMem5_X,
|
|
TRegMem6_X, TRegMem7_X, TRegMem8_X, TRegMem9_X, TRegMem10_X, TRegMem11_X,
|
|
TRegMem12_X, TRegMem13_X, TRegMem14_X, TRegMem15_X]
|
|
>;
|
|
|
|
def IndirectReg : RegisterClass<"AMDGPU", [f32, i32], 32, (add IndirectSuperReg)>;
|
|
|
|
// This register class defines the registers that are the storage units for
|
|
// the "Indirect Addressing" pseudo memory space.
|
|
// XXX: Only use the X channel, until we support wider stack widths
|
|
def TRegMem : RegisterClass<"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "TRegMem%u_X", 0, 16))
|
|
>;
|