mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-11-09 10:05:41 +00:00
f95b162188
The SelectionDAGBuilder was promoting vector kernel arguments to legal types, but this won't work for R600 and SI since kernel arguments are stored in memory and can't be promoted. In order to handle vector arguments correctly we need to look at the original types from the LLVM IR function. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@193215 91177308-0d34-0410-b5e6-96231b3b80d8
195 lines
8.5 KiB
TableGen
195 lines
8.5 KiB
TableGen
//===-- SIRegisterInfo.td - SI Register defs ---------------*- tablegen -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Declarations that describe the SI registers
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
class SIReg <string n, bits<16> encoding = 0> : Register<n> {
|
|
let Namespace = "AMDGPU";
|
|
let HWEncoding = encoding;
|
|
}
|
|
|
|
// Special Registers
|
|
def VCC : SIReg<"VCC", 106>;
|
|
def EXEC : SIReg<"EXEC", 126>;
|
|
def SCC : SIReg<"SCC", 253>;
|
|
def M0 : SIReg <"M0", 124>;
|
|
|
|
// SGPR registers
|
|
foreach Index = 0-101 in {
|
|
def SGPR#Index : SIReg <"SGPR"#Index, Index>;
|
|
}
|
|
|
|
// VGPR registers
|
|
foreach Index = 0-255 in {
|
|
def VGPR#Index : SIReg <"VGPR"#Index, Index> {
|
|
let HWEncoding{8} = 1;
|
|
}
|
|
}
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Groupings using register classes and tuples
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// SGPR 32-bit registers
|
|
def SGPR_32 : RegisterClass<"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "SGPR%u", 0, 101))>;
|
|
|
|
// SGPR 64-bit registers
|
|
def SGPR_64Regs : RegisterTuples<[sub0, sub1],
|
|
[(add (decimate (trunc SGPR_32, 101), 2)),
|
|
(add (decimate (shl SGPR_32, 1), 2))]>;
|
|
|
|
// SGPR 128-bit registers
|
|
def SGPR_128 : RegisterTuples<[sub0, sub1, sub2, sub3],
|
|
[(add (decimate (trunc SGPR_32, 99), 4)),
|
|
(add (decimate (shl SGPR_32, 1), 4)),
|
|
(add (decimate (shl SGPR_32, 2), 4)),
|
|
(add (decimate (shl SGPR_32, 3), 4))]>;
|
|
|
|
// SGPR 256-bit registers
|
|
def SGPR_256 : RegisterTuples<[sub0, sub1, sub2, sub3, sub4, sub5, sub6, sub7],
|
|
[(add (decimate (trunc SGPR_32, 95), 4)),
|
|
(add (decimate (shl SGPR_32, 1), 4)),
|
|
(add (decimate (shl SGPR_32, 2), 4)),
|
|
(add (decimate (shl SGPR_32, 3), 4)),
|
|
(add (decimate (shl SGPR_32, 4), 4)),
|
|
(add (decimate (shl SGPR_32, 5), 4)),
|
|
(add (decimate (shl SGPR_32, 6), 4)),
|
|
(add (decimate (shl SGPR_32, 7), 4))]>;
|
|
|
|
// SGPR 512-bit registers
|
|
def SGPR_512 : RegisterTuples<[sub0, sub1, sub2, sub3, sub4, sub5, sub6, sub7,
|
|
sub8, sub9, sub10, sub11, sub12, sub13, sub14, sub15],
|
|
[(add (decimate (trunc SGPR_32, 87), 4)),
|
|
(add (decimate (shl SGPR_32, 1), 4)),
|
|
(add (decimate (shl SGPR_32, 2), 4)),
|
|
(add (decimate (shl SGPR_32, 3), 4)),
|
|
(add (decimate (shl SGPR_32, 4), 4)),
|
|
(add (decimate (shl SGPR_32, 5), 4)),
|
|
(add (decimate (shl SGPR_32, 6), 4)),
|
|
(add (decimate (shl SGPR_32, 7), 4)),
|
|
(add (decimate (shl SGPR_32, 8), 4)),
|
|
(add (decimate (shl SGPR_32, 9), 4)),
|
|
(add (decimate (shl SGPR_32, 10), 4)),
|
|
(add (decimate (shl SGPR_32, 11), 4)),
|
|
(add (decimate (shl SGPR_32, 12), 4)),
|
|
(add (decimate (shl SGPR_32, 13), 4)),
|
|
(add (decimate (shl SGPR_32, 14), 4)),
|
|
(add (decimate (shl SGPR_32, 15), 4))]>;
|
|
|
|
// VGPR 32-bit registers
|
|
def VGPR_32 : RegisterClass<"AMDGPU", [f32, i32], 32,
|
|
(add (sequence "VGPR%u", 0, 255))>;
|
|
|
|
// VGPR 64-bit registers
|
|
def VGPR_64 : RegisterTuples<[sub0, sub1],
|
|
[(add (trunc VGPR_32, 255)),
|
|
(add (shl VGPR_32, 1))]>;
|
|
|
|
// VGPR 96-bit registers
|
|
def VGPR_96 : RegisterTuples<[sub0, sub1, sub2],
|
|
[(add (trunc VGPR_32, 254)),
|
|
(add (shl VGPR_32, 1)),
|
|
(add (shl VGPR_32, 2))]>;
|
|
|
|
// VGPR 128-bit registers
|
|
def VGPR_128 : RegisterTuples<[sub0, sub1, sub2, sub3],
|
|
[(add (trunc VGPR_32, 253)),
|
|
(add (shl VGPR_32, 1)),
|
|
(add (shl VGPR_32, 2)),
|
|
(add (shl VGPR_32, 3))]>;
|
|
|
|
// VGPR 256-bit registers
|
|
def VGPR_256 : RegisterTuples<[sub0, sub1, sub2, sub3, sub4, sub5, sub6, sub7],
|
|
[(add (trunc VGPR_32, 249)),
|
|
(add (shl VGPR_32, 1)),
|
|
(add (shl VGPR_32, 2)),
|
|
(add (shl VGPR_32, 3)),
|
|
(add (shl VGPR_32, 4)),
|
|
(add (shl VGPR_32, 5)),
|
|
(add (shl VGPR_32, 6)),
|
|
(add (shl VGPR_32, 7))]>;
|
|
|
|
// VGPR 512-bit registers
|
|
def VGPR_512 : RegisterTuples<[sub0, sub1, sub2, sub3, sub4, sub5, sub6, sub7,
|
|
sub8, sub9, sub10, sub11, sub12, sub13, sub14, sub15],
|
|
[(add (trunc VGPR_32, 241)),
|
|
(add (shl VGPR_32, 1)),
|
|
(add (shl VGPR_32, 2)),
|
|
(add (shl VGPR_32, 3)),
|
|
(add (shl VGPR_32, 4)),
|
|
(add (shl VGPR_32, 5)),
|
|
(add (shl VGPR_32, 6)),
|
|
(add (shl VGPR_32, 7)),
|
|
(add (shl VGPR_32, 8)),
|
|
(add (shl VGPR_32, 9)),
|
|
(add (shl VGPR_32, 10)),
|
|
(add (shl VGPR_32, 11)),
|
|
(add (shl VGPR_32, 12)),
|
|
(add (shl VGPR_32, 13)),
|
|
(add (shl VGPR_32, 14)),
|
|
(add (shl VGPR_32, 15))]>;
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// Register classes used as source and destination
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Special register classes for predicates and the M0 register
|
|
def SCCReg : RegisterClass<"AMDGPU", [i32, i1], 32, (add SCC)>;
|
|
def VCCReg : RegisterClass<"AMDGPU", [i64, i1], 64, (add VCC)>;
|
|
def EXECReg : RegisterClass<"AMDGPU", [i64, i1], 64, (add EXEC)>;
|
|
def M0Reg : RegisterClass<"AMDGPU", [i32], 32, (add M0)>;
|
|
|
|
// Register class for all scalar registers (SGPRs + Special Registers)
|
|
def SReg_32 : RegisterClass<"AMDGPU", [f32, i32], 32,
|
|
(add SGPR_32, M0Reg)
|
|
>;
|
|
|
|
def SGPR_64 : RegisterClass<"AMDGPU", [v2i32, i64], 64, (add SGPR_64Regs)>;
|
|
|
|
def SReg_64 : RegisterClass<"AMDGPU", [v2i32, i64, i1], 64,
|
|
(add SGPR_64Regs, VCCReg, EXECReg)
|
|
>;
|
|
|
|
def SReg_128 : RegisterClass<"AMDGPU", [i128, v4i32], 128, (add SGPR_128)>;
|
|
|
|
def SReg_256 : RegisterClass<"AMDGPU", [v32i8, v8i32, v8f32], 256, (add SGPR_256)>;
|
|
|
|
def SReg_512 : RegisterClass<"AMDGPU", [v64i8, v16i32], 512, (add SGPR_512)>;
|
|
|
|
// Register class for all vector registers (VGPRs + Interploation Registers)
|
|
def VReg_32 : RegisterClass<"AMDGPU", [i32, f32, v1i32], 32, (add VGPR_32)>;
|
|
|
|
def VReg_64 : RegisterClass<"AMDGPU", [i64, f64, v2i32, v2f32], 64, (add VGPR_64)>;
|
|
|
|
def VReg_96 : RegisterClass<"AMDGPU", [untyped], 96, (add VGPR_96)> {
|
|
let Size = 96;
|
|
}
|
|
|
|
def VReg_128 : RegisterClass<"AMDGPU", [v4i32, v4f32, i128], 128, (add VGPR_128)>;
|
|
|
|
def VReg_256 : RegisterClass<"AMDGPU", [v32i8, v8i32, v8f32], 256, (add VGPR_256)>;
|
|
|
|
def VReg_512 : RegisterClass<"AMDGPU", [v16i32, v16f32], 512, (add VGPR_512)>;
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// [SV]Src_* register classes, can have either an immediate or an register
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
def SSrc_32 : RegisterClass<"AMDGPU", [i32, f32], 32, (add SReg_32)>;
|
|
|
|
def SSrc_64 : RegisterClass<"AMDGPU", [i64, f64, i1], 64, (add SReg_64)>;
|
|
|
|
def VSrc_32 : RegisterClass<"AMDGPU", [i32, f32], 32, (add VReg_32, SReg_32)>;
|
|
|
|
def VSrc_64 : RegisterClass<"AMDGPU", [i64, f64], 64, (add VReg_64, SReg_64)>;
|
|
|