Reapply "Make NumMicroOps a variable in the subtarget's instruction itinerary."

Reapplies r159406 with minor cleanup. The regressions appear to have been spurious.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@159541 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Andrew Trick 2012-07-02 18:10:42 +00:00
parent 7c3a65c7ed
commit 218ee74a01
9 changed files with 81 additions and 63 deletions

View File

@ -95,7 +95,7 @@ struct InstrStage {
/// operands are read and written. /// operands are read and written.
/// ///
struct InstrItinerary { struct InstrItinerary {
unsigned NumMicroOps; ///< # of micro-ops, 0 means it's variable int NumMicroOps; ///< # of micro-ops, -1 means it's variable
unsigned FirstStage; ///< Index of first stage in itinerary unsigned FirstStage; ///< Index of first stage in itinerary
unsigned LastStage; ///< Index of last + 1 stage in itinerary unsigned LastStage; ///< Index of last + 1 stage in itinerary
unsigned FirstOperandCycle; ///< Index of first operand rd/wr unsigned FirstOperandCycle; ///< Index of first operand rd/wr
@ -323,7 +323,6 @@ public:
} }
}; };
} // End llvm namespace } // End llvm namespace
#endif #endif

View File

@ -651,7 +651,9 @@ public:
} }
/// getNumMicroOps - Return the number of u-operations the given machine /// getNumMicroOps - Return the number of u-operations the given machine
/// instruction will be decoded to on the target cpu. /// instruction will be decoded to on the target cpu. The itinerary's
/// IssueWidth is the number of microops that can be dispatched each
/// cycle. An instruction with zero microops takes no dispatch resources.
virtual unsigned getNumMicroOps(const InstrItineraryData *ItinData, virtual unsigned getNumMicroOps(const InstrItineraryData *ItinData,
const MachineInstr *MI) const = 0; const MachineInstr *MI) const = 0;

View File

@ -73,20 +73,20 @@ class InstrStage<int cycles, list<FuncUnit> units,
// across all chip sets. Thus a new chip set can be added without modifying // across all chip sets. Thus a new chip set can be added without modifying
// instruction information. // instruction information.
// //
// NumMicroOps represents the number of micro-operations that each instruction class InstrItinClass;
// in the class are decoded to. If the number is zero, then it means the
// instruction can decode into variable number of micro-ops and it must be
// determined dynamically.
//
class InstrItinClass<int ops = 1> {
int NumMicroOps = ops;
}
def NoItinerary : InstrItinClass; def NoItinerary : InstrItinClass;
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
// Instruction itinerary data - These values provide a runtime map of an // Instruction itinerary data - These values provide a runtime map of an
// instruction itinerary class (name) to its itinerary data. // instruction itinerary class (name) to its itinerary data.
// //
// NumMicroOps represents the number of micro-operations that each instruction
// in the class is decoded into. If the number is negative (-1), then it means
// the instruction can decode into a variable number of micro-ops and it must be
// determined dynamically. This directly relates to the itinerary's
// global IssueWidth property, which constrains the number of microops
// that can issue per cycle.
//
// OperandCycles are optional "cycle counts". They specify the cycle after // OperandCycles are optional "cycle counts". They specify the cycle after
// instruction issue the values which correspond to specific operand indices // instruction issue the values which correspond to specific operand indices
// are defined or read. Bypasses are optional "pipeline forwarding paths", if // are defined or read. Bypasses are optional "pipeline forwarding paths", if
@ -106,8 +106,9 @@ def NoItinerary : InstrItinClass;
// is reduced by 1. // is reduced by 1.
class InstrItinData<InstrItinClass Class, list<InstrStage> stages, class InstrItinData<InstrItinClass Class, list<InstrStage> stages,
list<int> operandcycles = [], list<int> operandcycles = [],
list<Bypass> bypasses = []> { list<Bypass> bypasses = [], int uops = 1> {
InstrItinClass TheClass = Class; InstrItinClass TheClass = Class;
int NumMicroOps = uops;
list<InstrStage> Stages = stages; list<InstrStage> Stages = stages;
list<int> OperandCycles = operandcycles; list<int> OperandCycles = operandcycles;
list<Bypass> Bypasses = bypasses; list<Bypass> Bypasses = bypasses;

View File

@ -560,8 +560,8 @@ TargetInstrInfoImpl::getNumMicroOps(const InstrItineraryData *ItinData,
return 1; return 1;
unsigned Class = MI->getDesc().getSchedClass(); unsigned Class = MI->getDesc().getSchedClass();
unsigned UOps = ItinData->Itineraries[Class].NumMicroOps; int UOps = ItinData->Itineraries[Class].NumMicroOps;
if (UOps) if (UOps >= 0)
return UOps; return UOps;
// The # of u-ops is dynamically determined. The specific target should // The # of u-ops is dynamically determined. The specific target should

View File

@ -2176,9 +2176,9 @@ ARMBaseInstrInfo::getNumMicroOps(const InstrItineraryData *ItinData,
const MCInstrDesc &Desc = MI->getDesc(); const MCInstrDesc &Desc = MI->getDesc();
unsigned Class = Desc.getSchedClass(); unsigned Class = Desc.getSchedClass();
unsigned UOps = ItinData->Itineraries[Class].NumMicroOps; int ItinUOps = ItinData->getNumMicroOps(Class);
if (UOps) if (ItinUOps >= 0)
return UOps; return ItinUOps;
unsigned Opc = MI->getOpcode(); unsigned Opc = MI->getOpcode();
switch (Opc) { switch (Opc) {
@ -2252,19 +2252,19 @@ ARMBaseInstrInfo::getNumMicroOps(const InstrItineraryData *ItinData,
return 2; return 2;
// 4 registers would be issued: 2, 2. // 4 registers would be issued: 2, 2.
// 5 registers would be issued: 2, 2, 1. // 5 registers would be issued: 2, 2, 1.
UOps = (NumRegs / 2); int A8UOps = (NumRegs / 2);
if (NumRegs % 2) if (NumRegs % 2)
++UOps; ++A8UOps;
return UOps; return A8UOps;
} else if (Subtarget.isCortexA9()) { } else if (Subtarget.isCortexA9()) {
UOps = (NumRegs / 2); int A9UOps = (NumRegs / 2);
// If there are odd number of registers or if it's not 64-bit aligned, // If there are odd number of registers or if it's not 64-bit aligned,
// then it takes an extra AGU (Address Generation Unit) cycle. // then it takes an extra AGU (Address Generation Unit) cycle.
if ((NumRegs % 2) || if ((NumRegs % 2) ||
!MI->hasOneMemOperand() || !MI->hasOneMemOperand() ||
(*MI->memoperands_begin())->getAlignment() < 8) (*MI->memoperands_begin())->getAlignment() < 8)
++UOps; ++A9UOps;
return UOps; return A9UOps;
} else { } else {
// Assume the worst. // Assume the worst.
return NumRegs; return NumRegs;
@ -3057,7 +3057,8 @@ unsigned ARMBaseInstrInfo::getInstrLatency(const InstrItineraryData *ItinData,
unsigned Class = MCID.getSchedClass(); unsigned Class = MCID.getSchedClass();
// For instructions with variable uops, use uops as latency. // For instructions with variable uops, use uops as latency.
if (!ItinData->isEmpty() && !ItinData->Itineraries[Class].NumMicroOps) { if (!ItinData->isEmpty() && ItinData->getNumMicroOps(Class) < 0) {
dbgs() << "UOPS " << getNumMicroOps(ItinData, MI) << " " << *MI << '\n';
return getNumMicroOps(ItinData, MI); return getNumMicroOps(ItinData, MI);
} }
// For the common case, fall back on the itinerary's latency. // For the common case, fall back on the itinerary's latency.

View File

@ -70,11 +70,11 @@ def IIC_iLoad_bh_siu : InstrItinClass;
def IIC_iLoad_d_i : InstrItinClass; def IIC_iLoad_d_i : InstrItinClass;
def IIC_iLoad_d_r : InstrItinClass; def IIC_iLoad_d_r : InstrItinClass;
def IIC_iLoad_d_ru : InstrItinClass; def IIC_iLoad_d_ru : InstrItinClass;
def IIC_iLoad_m : InstrItinClass<0>; // micro-coded def IIC_iLoad_m : InstrItinClass;
def IIC_iLoad_mu : InstrItinClass<0>; // micro-coded def IIC_iLoad_mu : InstrItinClass;
def IIC_iLoad_mBr : InstrItinClass<0>; // micro-coded def IIC_iLoad_mBr : InstrItinClass;
def IIC_iPop : InstrItinClass<0>; // micro-coded def IIC_iPop : InstrItinClass;
def IIC_iPop_Br : InstrItinClass<0>; // micro-coded def IIC_iPop_Br : InstrItinClass;
def IIC_iLoadiALU : InstrItinClass; def IIC_iLoadiALU : InstrItinClass;
def IIC_iStore_i : InstrItinClass; def IIC_iStore_i : InstrItinClass;
def IIC_iStore_r : InstrItinClass; def IIC_iStore_r : InstrItinClass;
@ -91,8 +91,8 @@ def IIC_iStore_bh_siu : InstrItinClass;
def IIC_iStore_d_i : InstrItinClass; def IIC_iStore_d_i : InstrItinClass;
def IIC_iStore_d_r : InstrItinClass; def IIC_iStore_d_r : InstrItinClass;
def IIC_iStore_d_ru : InstrItinClass; def IIC_iStore_d_ru : InstrItinClass;
def IIC_iStore_m : InstrItinClass<0>; // micro-coded def IIC_iStore_m : InstrItinClass;
def IIC_iStore_mu : InstrItinClass<0>; // micro-coded def IIC_iStore_mu : InstrItinClass;
def IIC_Preload : InstrItinClass; def IIC_Preload : InstrItinClass;
def IIC_Br : InstrItinClass; def IIC_Br : InstrItinClass;
def IIC_fpSTAT : InstrItinClass; def IIC_fpSTAT : InstrItinClass;
@ -126,12 +126,12 @@ def IIC_fpSQRT32 : InstrItinClass;
def IIC_fpSQRT64 : InstrItinClass; def IIC_fpSQRT64 : InstrItinClass;
def IIC_fpLoad32 : InstrItinClass; def IIC_fpLoad32 : InstrItinClass;
def IIC_fpLoad64 : InstrItinClass; def IIC_fpLoad64 : InstrItinClass;
def IIC_fpLoad_m : InstrItinClass<0>; // micro-coded def IIC_fpLoad_m : InstrItinClass;
def IIC_fpLoad_mu : InstrItinClass<0>; // micro-coded def IIC_fpLoad_mu : InstrItinClass;
def IIC_fpStore32 : InstrItinClass; def IIC_fpStore32 : InstrItinClass;
def IIC_fpStore64 : InstrItinClass; def IIC_fpStore64 : InstrItinClass;
def IIC_fpStore_m : InstrItinClass<0>; // micro-coded def IIC_fpStore_m : InstrItinClass;
def IIC_fpStore_mu : InstrItinClass<0>; // micro-coded def IIC_fpStore_mu : InstrItinClass;
def IIC_VLD1 : InstrItinClass; def IIC_VLD1 : InstrItinClass;
def IIC_VLD1x2 : InstrItinClass; def IIC_VLD1x2 : InstrItinClass;
def IIC_VLD1x3 : InstrItinClass; def IIC_VLD1x3 : InstrItinClass;

View File

@ -155,28 +155,30 @@ def CortexA8Itineraries : MultiIssueItineraries<
// Load multiple, def is the 5th operand. Pipeline 0 only. // Load multiple, def is the 5th operand. Pipeline 0 only.
// FIXME: A8_LSPipe cycle time is dynamic, this assumes 3 to 4 registers. // FIXME: A8_LSPipe cycle time is dynamic, this assumes 3 to 4 registers.
InstrItinData<IIC_iLoad_m , [InstrStage<2, [A8_Pipe0], 0>, InstrItinData<IIC_iLoad_m , [InstrStage<2, [A8_Pipe0], 0>,
InstrStage<2, [A8_LSPipe]>], [1, 1, 1, 1, 3]>, InstrStage<2, [A8_LSPipe]>],
[1, 1, 1, 1, 3], [], -1>, // dynamic uops
// //
// Load multiple + update, defs are the 1st and 5th operands. // Load multiple + update, defs are the 1st and 5th operands.
InstrItinData<IIC_iLoad_mu , [InstrStage<3, [A8_Pipe0], 0>, InstrItinData<IIC_iLoad_mu , [InstrStage<3, [A8_Pipe0], 0>,
InstrStage<3, [A8_LSPipe]>], [2, 1, 1, 1, 3]>, InstrStage<3, [A8_LSPipe]>],
[2, 1, 1, 1, 3], [], -1>, // dynamic uops
// //
// Load multiple plus branch // Load multiple plus branch
InstrItinData<IIC_iLoad_mBr, [InstrStage<3, [A8_Pipe0], 0>, InstrItinData<IIC_iLoad_mBr, [InstrStage<3, [A8_Pipe0], 0>,
InstrStage<3, [A8_LSPipe]>, InstrStage<3, [A8_LSPipe]>,
InstrStage<1, [A8_Pipe0, A8_Pipe1]>], InstrStage<1, [A8_Pipe0, A8_Pipe1]>],
[1, 2, 1, 1, 3]>, [1, 2, 1, 1, 3], [], -1>, // dynamic uops
// //
// Pop, def is the 3rd operand. // Pop, def is the 3rd operand.
InstrItinData<IIC_iPop , [InstrStage<3, [A8_Pipe0], 0>, InstrItinData<IIC_iPop , [InstrStage<3, [A8_Pipe0], 0>,
InstrStage<3, [A8_LSPipe]>], [1, 1, 3]>, InstrStage<3, [A8_LSPipe]>],
[1, 1, 3], [], -1>, // dynamic uops
// //
// Pop + branch, def is the 3rd operand. // Pop + branch, def is the 3rd operand.
InstrItinData<IIC_iPop_Br, [InstrStage<3, [A8_Pipe0], 0>, InstrItinData<IIC_iPop_Br, [InstrStage<3, [A8_Pipe0], 0>,
InstrStage<3, [A8_LSPipe]>, InstrStage<3, [A8_LSPipe]>,
InstrStage<1, [A8_Pipe0, A8_Pipe1]>], InstrStage<1, [A8_Pipe0, A8_Pipe1]>],
[1, 1, 3]>, [1, 1, 3], [], -1>, // dynamic uops
// //
// iLoadi + iALUr for t2LDRpci_pic. // iLoadi + iALUr for t2LDRpci_pic.
InstrItinData<IIC_iLoadiALU, [InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>, InstrItinData<IIC_iLoadiALU, [InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>,
@ -231,12 +233,13 @@ def CortexA8Itineraries : MultiIssueItineraries<
// Store multiple. Pipeline 0 only. // Store multiple. Pipeline 0 only.
// FIXME: A8_LSPipe cycle time is dynamic, this assumes 3 to 4 registers. // FIXME: A8_LSPipe cycle time is dynamic, this assumes 3 to 4 registers.
InstrItinData<IIC_iStore_m , [InstrStage<2, [A8_Pipe0], 0>, InstrItinData<IIC_iStore_m , [InstrStage<2, [A8_Pipe0], 0>,
InstrStage<2, [A8_LSPipe]>]>, InstrStage<2, [A8_LSPipe]>],
[], [], -1>, // dynamic uops
// //
// Store multiple + update // Store multiple + update
InstrItinData<IIC_iStore_mu, [InstrStage<2, [A8_Pipe0], 0>, InstrItinData<IIC_iStore_mu, [InstrStage<2, [A8_Pipe0], 0>,
InstrStage<2, [A8_LSPipe]>], [2]>, InstrStage<2, [A8_LSPipe]>],
[2], [], -1>, // dynamic uops
// //
// Preload // Preload
InstrItinData<IIC_Preload, [InstrStage<1, [A8_Pipe0, A8_Pipe1]>], [2, 2]>, InstrItinData<IIC_Preload, [InstrStage<1, [A8_Pipe0, A8_Pipe1]>], [2, 2]>,
@ -397,14 +400,16 @@ def CortexA8Itineraries : MultiIssueItineraries<
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>, InstrStage<1, [A8_LSPipe]>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>], [1, 1, 1, 2]>, InstrStage<1, [A8_LSPipe]>],
[1, 1, 1, 2], [], -1>, // dynamic uops
// //
// FP Load Multiple + update // FP Load Multiple + update
InstrItinData<IIC_fpLoad_mu,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>, InstrItinData<IIC_fpLoad_mu,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>, InstrStage<1, [A8_LSPipe]>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>], [2, 1, 1, 1, 2]>, InstrStage<1, [A8_LSPipe]>],
[2, 1, 1, 1, 2], [], -1>, // dynamic uops
// //
// Single-precision FP Store // Single-precision FP Store
InstrItinData<IIC_fpStore32,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>, InstrItinData<IIC_fpStore32,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>,
@ -423,15 +428,16 @@ def CortexA8Itineraries : MultiIssueItineraries<
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>, InstrStage<1, [A8_LSPipe]>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>], [1, 1, 1, 1]>, InstrStage<1, [A8_LSPipe]>],
[1, 1, 1, 1], [], -1>, // dynamic uops
// //
// FP Store Multiple + update // FP Store Multiple + update
InstrItinData<IIC_fpStore_mu,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>, InstrItinData<IIC_fpStore_mu,[InstrStage<1, [A8_Pipe0, A8_Pipe1], 0>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>, InstrStage<1, [A8_LSPipe]>,
InstrStage<1, [A8_NLSPipe], 0>, InstrStage<1, [A8_NLSPipe], 0>,
InstrStage<1, [A8_LSPipe]>], [2, 1, 1, 1, 1]>, InstrStage<1, [A8_LSPipe]>],
[2, 1, 1, 1, 1], [], -1>, // dynamic uops
// NEON // NEON
// Issue through integer pipeline, and execute in NEON unit. // Issue through integer pipeline, and execute in NEON unit.
// //

View File

@ -284,7 +284,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<2, [A9_AGU], 1>, InstrStage<2, [A9_AGU], 1>,
InstrStage<2, [A9_LSUnit]>], InstrStage<2, [A9_LSUnit]>],
[1, 1, 1, 1, 3], [1, 1, 1, 1, 3],
[NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass]>, [NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass],
-1>, // dynamic uops
// //
// Load multiple + update, defs are the 1st and 5th operands. // Load multiple + update, defs are the 1st and 5th operands.
InstrItinData<IIC_iLoad_mu , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iLoad_mu , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -292,7 +293,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<2, [A9_AGU], 1>, InstrStage<2, [A9_AGU], 1>,
InstrStage<2, [A9_LSUnit]>], InstrStage<2, [A9_LSUnit]>],
[2, 1, 1, 1, 3], [2, 1, 1, 1, 3],
[NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass]>, [NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass],
-1>, // dynamic uops
// //
// Load multiple plus branch // Load multiple plus branch
InstrItinData<IIC_iLoad_mBr, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iLoad_mBr, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -301,7 +303,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<2, [A9_LSUnit]>, InstrStage<2, [A9_LSUnit]>,
InstrStage<1, [A9_Branch]>], InstrStage<1, [A9_Branch]>],
[1, 2, 1, 1, 3], [1, 2, 1, 1, 3],
[NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass]>, [NoBypass, NoBypass, NoBypass, NoBypass, A9_LdBypass],
-1>, // dynamic uops
// //
// Pop, def is the 3rd operand. // Pop, def is the 3rd operand.
InstrItinData<IIC_iPop , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iPop , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -309,7 +312,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<2, [A9_AGU], 1>, InstrStage<2, [A9_AGU], 1>,
InstrStage<2, [A9_LSUnit]>], InstrStage<2, [A9_LSUnit]>],
[1, 1, 3], [1, 1, 3],
[NoBypass, NoBypass, A9_LdBypass]>, [NoBypass, NoBypass, A9_LdBypass],
-1>, // dynamic uops
// //
// Pop + branch, def is the 3rd operand. // Pop + branch, def is the 3rd operand.
InstrItinData<IIC_iPop_Br, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iPop_Br, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -318,8 +322,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<2, [A9_LSUnit]>, InstrStage<2, [A9_LSUnit]>,
InstrStage<1, [A9_Branch]>], InstrStage<1, [A9_Branch]>],
[1, 1, 3], [1, 1, 3],
[NoBypass, NoBypass, A9_LdBypass]>, [NoBypass, NoBypass, A9_LdBypass],
-1>, // dynamic uops
// //
// iLoadi + iALUr for t2LDRpci_pic. // iLoadi + iALUr for t2LDRpci_pic.
InstrItinData<IIC_iLoadiALU, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iLoadiALU, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -413,14 +417,15 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrItinData<IIC_iStore_m , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iStore_m , [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
InstrStage<1, [A9_MUX0], 0>, InstrStage<1, [A9_MUX0], 0>,
InstrStage<1, [A9_AGU], 0>, InstrStage<1, [A9_AGU], 0>,
InstrStage<2, [A9_LSUnit]>]>, InstrStage<2, [A9_LSUnit]>],
[], [], -1>, // dynamic uops
// //
// Store multiple + update // Store multiple + update
InstrItinData<IIC_iStore_mu, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_iStore_mu, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
InstrStage<1, [A9_MUX0], 0>, InstrStage<1, [A9_MUX0], 0>,
InstrStage<1, [A9_AGU], 0>, InstrStage<1, [A9_AGU], 0>,
InstrStage<2, [A9_LSUnit]>], [2]>, InstrStage<2, [A9_LSUnit]>],
[2], [], -1>, // dynamic uops
// //
// Preload // Preload
InstrItinData<IIC_Preload, [InstrStage<1, [A9_Issue0, A9_Issue1]>], [1, 1]>, InstrItinData<IIC_Preload, [InstrStage<1, [A9_Issue0, A9_Issue1]>], [1, 1]>,
@ -717,7 +722,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<1, [A9_DRegsVFP], 0, Required>, InstrStage<1, [A9_DRegsVFP], 0, Required>,
InstrStage<2, [A9_DRegsN], 0, Reserved>, InstrStage<2, [A9_DRegsN], 0, Reserved>,
InstrStage<1, [A9_NPipe], 0>, InstrStage<1, [A9_NPipe], 0>,
InstrStage<2, [A9_LSUnit]>], [1, 1, 1, 1]>, InstrStage<2, [A9_LSUnit]>],
[1, 1, 1, 1], [], -1>, // dynamic uops
// //
// FP Load Multiple + update // FP Load Multiple + update
// FIXME: assumes 2 doubles which requires 2 LS cycles. // FIXME: assumes 2 doubles which requires 2 LS cycles.
@ -726,7 +732,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<1, [A9_DRegsVFP], 0, Required>, InstrStage<1, [A9_DRegsVFP], 0, Required>,
InstrStage<2, [A9_DRegsN], 0, Reserved>, InstrStage<2, [A9_DRegsN], 0, Reserved>,
InstrStage<1, [A9_NPipe], 0>, InstrStage<1, [A9_NPipe], 0>,
InstrStage<2, [A9_LSUnit]>], [2, 1, 1, 1]>, InstrStage<2, [A9_LSUnit]>],
[2, 1, 1, 1], [], -1>, // dynamic uops
// //
// Single-precision FP Store // Single-precision FP Store
InstrItinData<IIC_fpStore32,[InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_fpStore32,[InstrStage<1, [A9_Issue0, A9_Issue1], 0>,
@ -753,7 +760,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<1, [A9_DRegsVFP], 0, Required>, InstrStage<1, [A9_DRegsVFP], 0, Required>,
InstrStage<2, [A9_DRegsN], 0, Reserved>, InstrStage<2, [A9_DRegsN], 0, Reserved>,
InstrStage<1, [A9_NPipe], 0>, InstrStage<1, [A9_NPipe], 0>,
InstrStage<2, [A9_LSUnit]>], [1, 1, 1, 1]>, InstrStage<2, [A9_LSUnit]>],
[1, 1, 1, 1], [], -1>, // dynamic uops
// //
// FP Store Multiple + update // FP Store Multiple + update
// FIXME: assumes 2 doubles which requires 2 LS cycles. // FIXME: assumes 2 doubles which requires 2 LS cycles.
@ -762,7 +770,8 @@ def CortexA9Itineraries : MultiIssueItineraries<
InstrStage<1, [A9_DRegsVFP], 0, Required>, InstrStage<1, [A9_DRegsVFP], 0, Required>,
InstrStage<2, [A9_DRegsN], 0, Reserved>, InstrStage<2, [A9_DRegsN], 0, Reserved>,
InstrStage<1, [A9_NPipe], 0>, InstrStage<1, [A9_NPipe], 0>,
InstrStage<2, [A9_LSUnit]>], [2, 1, 1, 1]>, InstrStage<2, [A9_LSUnit]>],
[2, 1, 1, 1], [], -1>, // dynamic uops
// NEON // NEON
// VLD1 // VLD1
InstrItinData<IIC_VLD1, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>, InstrItinData<IIC_VLD1, [InstrStage<1, [A9_Issue0, A9_Issue1], 0>,

View File

@ -498,7 +498,7 @@ void SubtargetEmitter::EmitStageAndOperandCycleData(raw_ostream &OS,
unsigned Find = ItinClassesMap[Name]; unsigned Find = ItinClassesMap[Name];
// Set up itinerary as location and location + stage count // Set up itinerary as location and location + stage count
unsigned NumUOps = ItinClassList[Find]->getValueAsInt("NumMicroOps"); unsigned NumUOps = ItinData->getValueAsInt("NumMicroOps");
InstrItinerary Intinerary = { NumUOps, FindStage, FindStage + NStages, InstrItinerary Intinerary = { NumUOps, FindStage, FindStage + NStages,
FindOperandCycle, FindOperandCycle,
FindOperandCycle + NOperandCycles}; FindOperandCycle + NOperandCycles};