mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-26 07:34:06 +00:00
[X86] Add support for builtin to read performance monitoring counters.
This patch adds support for a new builtin instruction called __builtin_ia32_rdpmc. Builtin '__builtin_ia32_rdpmc' is defined as a 'GCC builtin'; on X86, it can be used to read performance monitoring counters. It takes as input the index of the performance counter to read, and returns the value of the specified performance counter as a 64-bit number. Calls to this new builtin will map to instruction RDPMC. The index in input to the builtin call is moved to register %ECX. The result of the builtin call is the value of the specified performance counter (RDPMC would return that quantity in registers RDX:RAX). This patch: - Adds builtin int_x86_rdpmc as a GCCBuiltin; - Adds a new x86 DAG node called 'RDPMC_DAG'; - Teaches how to lower this new builtin; - Adds an ISel pattern to select instruction RDPMC; - Fixes the definition of instruction RDPMC adding %RAX and %RDX as implicit definitions, and adding %ECX as implicit use; - Adds a LLVM test to verify that the new builtin is correctly selected. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212049 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
adb277d42f
commit
e6cfdc8471
@ -26,6 +26,12 @@ let TargetPrefix = "x86" in {
|
|||||||
Intrinsic<[llvm_i64_ty], [llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
Intrinsic<[llvm_i64_ty], [llvm_ptr_ty], [IntrReadWriteArgMem]>;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Read Performance-Monitoring Counter.
|
||||||
|
let TargetPrefix = "x86" in {
|
||||||
|
def int_x86_rdpmc : GCCBuiltin<"__builtin_ia32_rdpmc">,
|
||||||
|
Intrinsic<[llvm_i64_ty], [llvm_i32_ty], []>;
|
||||||
|
}
|
||||||
|
|
||||||
//===----------------------------------------------------------------------===//
|
//===----------------------------------------------------------------------===//
|
||||||
// 3DNow!
|
// 3DNow!
|
||||||
|
|
||||||
|
@ -14225,6 +14225,51 @@ static SDValue getPrefetchNode(unsigned Opc, SDValue Op, SelectionDAG &DAG,
|
|||||||
return SDValue(Res, 0);
|
return SDValue(Res, 0);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// getReadPerformanceCounter - Handles the lowering of builtin intrinsics that
|
||||||
|
// read performance monitor counters (x86_rdpmc).
|
||||||
|
static void getReadPerformanceCounter(SDNode *N, SDLoc DL,
|
||||||
|
SelectionDAG &DAG, const X86Subtarget *Subtarget,
|
||||||
|
SmallVectorImpl<SDValue> &Results) {
|
||||||
|
assert(N->getNumOperands() == 3 && "Unexpected number of operands!");
|
||||||
|
SDVTList Tys = DAG.getVTList(MVT::Other, MVT::Glue);
|
||||||
|
SDValue LO, HI;
|
||||||
|
|
||||||
|
// The ECX register is used to select the index of the performance counter
|
||||||
|
// to read.
|
||||||
|
SDValue Chain = DAG.getCopyToReg(N->getOperand(0), DL, X86::ECX,
|
||||||
|
N->getOperand(2));
|
||||||
|
SDValue rd = DAG.getNode(X86ISD::RDPMC_DAG, DL, Tys, Chain);
|
||||||
|
|
||||||
|
// Reads the content of a 64-bit performance counter and returns it in the
|
||||||
|
// registers EDX:EAX.
|
||||||
|
if (Subtarget->is64Bit()) {
|
||||||
|
LO = DAG.getCopyFromReg(rd, DL, X86::RAX, MVT::i64, rd.getValue(1));
|
||||||
|
HI = DAG.getCopyFromReg(LO.getValue(1), DL, X86::RDX, MVT::i64,
|
||||||
|
LO.getValue(2));
|
||||||
|
} else {
|
||||||
|
LO = DAG.getCopyFromReg(rd, DL, X86::EAX, MVT::i32, rd.getValue(1));
|
||||||
|
HI = DAG.getCopyFromReg(LO.getValue(1), DL, X86::EDX, MVT::i32,
|
||||||
|
LO.getValue(2));
|
||||||
|
}
|
||||||
|
Chain = HI.getValue(1);
|
||||||
|
|
||||||
|
if (Subtarget->is64Bit()) {
|
||||||
|
// The EAX register is loaded with the low-order 32 bits. The EDX register
|
||||||
|
// is loaded with the supported high-order bits of the counter.
|
||||||
|
SDValue Tmp = DAG.getNode(ISD::SHL, DL, MVT::i64, HI,
|
||||||
|
DAG.getConstant(32, MVT::i8));
|
||||||
|
Results.push_back(DAG.getNode(ISD::OR, DL, MVT::i64, LO, Tmp));
|
||||||
|
Results.push_back(Chain);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Use a buildpair to merge the two 32-bit values into a 64-bit one.
|
||||||
|
SDValue Ops[] = { LO, HI };
|
||||||
|
SDValue Pair = DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i64, Ops);
|
||||||
|
Results.push_back(Pair);
|
||||||
|
Results.push_back(Chain);
|
||||||
|
}
|
||||||
|
|
||||||
// getReadTimeStampCounter - Handles the lowering of builtin intrinsics that
|
// getReadTimeStampCounter - Handles the lowering of builtin intrinsics that
|
||||||
// read the time stamp counter (x86_rdtsc and x86_rdtscp). This function is
|
// read the time stamp counter (x86_rdtsc and x86_rdtscp). This function is
|
||||||
// also used to custom lower READCYCLECOUNTER nodes.
|
// also used to custom lower READCYCLECOUNTER nodes.
|
||||||
@ -14289,7 +14334,7 @@ static SDValue LowerREADCYCLECOUNTER(SDValue Op, const X86Subtarget *Subtarget,
|
|||||||
}
|
}
|
||||||
|
|
||||||
enum IntrinsicType {
|
enum IntrinsicType {
|
||||||
GATHER, SCATTER, PREFETCH, RDSEED, RDRAND, RDTSC, XTEST
|
GATHER, SCATTER, PREFETCH, RDSEED, RDRAND, RDPMC, RDTSC, XTEST
|
||||||
};
|
};
|
||||||
|
|
||||||
struct IntrinsicData {
|
struct IntrinsicData {
|
||||||
@ -14383,6 +14428,8 @@ static void InitIntinsicsMap() {
|
|||||||
IntrinsicData(RDTSC, X86ISD::RDTSC_DAG, 0)));
|
IntrinsicData(RDTSC, X86ISD::RDTSC_DAG, 0)));
|
||||||
IntrMap.insert(std::make_pair(Intrinsic::x86_rdtscp,
|
IntrMap.insert(std::make_pair(Intrinsic::x86_rdtscp,
|
||||||
IntrinsicData(RDTSC, X86ISD::RDTSCP_DAG, 0)));
|
IntrinsicData(RDTSC, X86ISD::RDTSCP_DAG, 0)));
|
||||||
|
IntrMap.insert(std::make_pair(Intrinsic::x86_rdpmc,
|
||||||
|
IntrinsicData(RDPMC, X86ISD::RDPMC_DAG, 0)));
|
||||||
Initialized = true;
|
Initialized = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -14458,6 +14505,12 @@ static SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, const X86Subtarget *Subtarget,
|
|||||||
getReadTimeStampCounter(Op.getNode(), dl, Intr.Opc0, DAG, Subtarget, Results);
|
getReadTimeStampCounter(Op.getNode(), dl, Intr.Opc0, DAG, Subtarget, Results);
|
||||||
return DAG.getMergeValues(Results, dl);
|
return DAG.getMergeValues(Results, dl);
|
||||||
}
|
}
|
||||||
|
// Read Performance Monitoring Counters.
|
||||||
|
case RDPMC: {
|
||||||
|
SmallVector<SDValue, 2> Results;
|
||||||
|
getReadPerformanceCounter(Op.getNode(), dl, DAG, Subtarget, Results);
|
||||||
|
return DAG.getMergeValues(Results, dl);
|
||||||
|
}
|
||||||
// XTEST intrinsics.
|
// XTEST intrinsics.
|
||||||
case XTEST: {
|
case XTEST: {
|
||||||
SDVTList VTs = DAG.getVTList(Op->getValueType(0), MVT::Other);
|
SDVTList VTs = DAG.getVTList(Op->getValueType(0), MVT::Other);
|
||||||
@ -16282,6 +16335,8 @@ void X86TargetLowering::ReplaceNodeResults(SDNode *N,
|
|||||||
case Intrinsic::x86_rdtscp:
|
case Intrinsic::x86_rdtscp:
|
||||||
return getReadTimeStampCounter(N, dl, X86ISD::RDTSCP_DAG, DAG, Subtarget,
|
return getReadTimeStampCounter(N, dl, X86ISD::RDTSCP_DAG, DAG, Subtarget,
|
||||||
Results);
|
Results);
|
||||||
|
case Intrinsic::x86_rdpmc:
|
||||||
|
return getReadPerformanceCounter(N, dl, DAG, Subtarget, Results);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
case ISD::READCYCLECOUNTER: {
|
case ISD::READCYCLECOUNTER: {
|
||||||
@ -16446,6 +16501,7 @@ const char *X86TargetLowering::getTargetNodeName(unsigned Opcode) const {
|
|||||||
case X86ISD::CALL: return "X86ISD::CALL";
|
case X86ISD::CALL: return "X86ISD::CALL";
|
||||||
case X86ISD::RDTSC_DAG: return "X86ISD::RDTSC_DAG";
|
case X86ISD::RDTSC_DAG: return "X86ISD::RDTSC_DAG";
|
||||||
case X86ISD::RDTSCP_DAG: return "X86ISD::RDTSCP_DAG";
|
case X86ISD::RDTSCP_DAG: return "X86ISD::RDTSCP_DAG";
|
||||||
|
case X86ISD::RDPMC_DAG: return "X86ISD::RDPMC_DAG";
|
||||||
case X86ISD::BT: return "X86ISD::BT";
|
case X86ISD::BT: return "X86ISD::BT";
|
||||||
case X86ISD::CMP: return "X86ISD::CMP";
|
case X86ISD::CMP: return "X86ISD::CMP";
|
||||||
case X86ISD::COMI: return "X86ISD::COMI";
|
case X86ISD::COMI: return "X86ISD::COMI";
|
||||||
|
@ -86,6 +86,9 @@ namespace llvm {
|
|||||||
/// X86 Read Time-Stamp Counter and Processor ID.
|
/// X86 Read Time-Stamp Counter and Processor ID.
|
||||||
RDTSCP_DAG,
|
RDTSCP_DAG,
|
||||||
|
|
||||||
|
/// X86 Read Performance Monitoring Counters.
|
||||||
|
RDPMC_DAG,
|
||||||
|
|
||||||
/// X86 compare and logical compare instructions.
|
/// X86 compare and logical compare instructions.
|
||||||
CMP, COMI, UCOMI,
|
CMP, COMI, UCOMI,
|
||||||
|
|
||||||
|
@ -208,6 +208,8 @@ def X86rdtsc : SDNode<"X86ISD::RDTSC_DAG", SDTX86Void,
|
|||||||
[SDNPHasChain, SDNPOutGlue, SDNPSideEffect]>;
|
[SDNPHasChain, SDNPOutGlue, SDNPSideEffect]>;
|
||||||
def X86rdtscp : SDNode<"X86ISD::RDTSCP_DAG", SDTX86Void,
|
def X86rdtscp : SDNode<"X86ISD::RDTSCP_DAG", SDTX86Void,
|
||||||
[SDNPHasChain, SDNPOutGlue, SDNPSideEffect]>;
|
[SDNPHasChain, SDNPOutGlue, SDNPSideEffect]>;
|
||||||
|
def X86rdpmc : SDNode<"X86ISD::RDPMC_DAG", SDTX86Void,
|
||||||
|
[SDNPHasChain, SDNPOutGlue, SDNPSideEffect]>;
|
||||||
|
|
||||||
def X86Wrapper : SDNode<"X86ISD::Wrapper", SDTX86Wrapper>;
|
def X86Wrapper : SDNode<"X86ISD::Wrapper", SDTX86Wrapper>;
|
||||||
def X86WrapperRIP : SDNode<"X86ISD::WrapperRIP", SDTX86Wrapper>;
|
def X86WrapperRIP : SDNode<"X86ISD::WrapperRIP", SDTX86Wrapper>;
|
||||||
|
@ -439,7 +439,10 @@ def LLDT16m : I<0x00, MRM2m, (outs), (ins i16mem:$src),
|
|||||||
let SchedRW = [WriteSystem] in {
|
let SchedRW = [WriteSystem] in {
|
||||||
def WRMSR : I<0x30, RawFrm, (outs), (ins), "wrmsr", [], IIC_WRMSR>, TB;
|
def WRMSR : I<0x30, RawFrm, (outs), (ins), "wrmsr", [], IIC_WRMSR>, TB;
|
||||||
def RDMSR : I<0x32, RawFrm, (outs), (ins), "rdmsr", [], IIC_RDMSR>, TB;
|
def RDMSR : I<0x32, RawFrm, (outs), (ins), "rdmsr", [], IIC_RDMSR>, TB;
|
||||||
def RDPMC : I<0x33, RawFrm, (outs), (ins), "rdpmc", [], IIC_RDPMC>, TB;
|
|
||||||
|
let Defs = [RAX, RDX], Uses = [ECX] in
|
||||||
|
def RDPMC : I<0x33, RawFrm, (outs), (ins), "rdpmc", [(X86rdpmc)], IIC_RDPMC>,
|
||||||
|
TB;
|
||||||
|
|
||||||
def SMSW16r : I<0x01, MRM4r, (outs GR16:$dst), (ins),
|
def SMSW16r : I<0x01, MRM4r, (outs GR16:$dst), (ins),
|
||||||
"smsw{w}\t$dst", [], IIC_SMSW>, OpSize16, TB;
|
"smsw{w}\t$dst", [], IIC_SMSW>, OpSize16, TB;
|
||||||
|
22
test/CodeGen/X86/rdpmc.ll
Normal file
22
test/CodeGen/X86/rdpmc.ll
Normal file
@ -0,0 +1,22 @@
|
|||||||
|
; RUN: llc < %s -march=x86-64 -mcpu=generic | FileCheck %s --check-prefix=CHECK --check-prefix=X86-64
|
||||||
|
; RUN: llc < %s -march=x86 -mcpu=generic | FileCheck %s --check-prefix=CHECK --check-prefix=X86
|
||||||
|
|
||||||
|
; Verify that we correctly lower the "Read Performance-Monitoring Counters"
|
||||||
|
; x86 builtin.
|
||||||
|
|
||||||
|
|
||||||
|
define i64 @test_builtin_read_pmc(i32 %ID) {
|
||||||
|
%1 = tail call i64 @llvm.x86.rdpmc(i32 %ID)
|
||||||
|
ret i64 %1
|
||||||
|
}
|
||||||
|
; CHECK-LABEL: test_builtin_read_pmc
|
||||||
|
; CHECK: rdpmc
|
||||||
|
; X86-NOT: shlq
|
||||||
|
; X86-NOT: or
|
||||||
|
; X86-64: shlq
|
||||||
|
; X86-64: or
|
||||||
|
; CHECK-NOT: mov
|
||||||
|
; CHECK: ret
|
||||||
|
|
||||||
|
declare i64 @llvm.x86.rdpmc(i32 %ID)
|
||||||
|
|
Loading…
x
Reference in New Issue
Block a user