24#define DEBUG_TYPE "llvm-mca-instrbuilder"
36 : STI(sti), MCII(mcii),
MRI(mri), MCIA(mcia), IM(
im), FirstCallInst(
true),
37 FirstReturnInst(
true), CallLatency(cl) {
50 using ResourcePlusCycles = std::pair<uint64_t, ResourceUsage>;
66 APInt Buffers(NumProcResources, 0);
68 bool AllInOrderResources =
true;
69 bool AnyDispatchHazards =
false;
76 <<
"Ignoring invalid write of zero cycles on processor resource "
79 <<
" (write index #" <<
I <<
")\n";
86 AllInOrderResources =
false;
101 ID.MustIssueImmediately = AllInOrderResources && AnyDispatchHazards;
105 sort(Worklist, [](
const ResourcePlusCycles &
A,
const ResourcePlusCycles &
B) {
108 if (popcntA < popcntB)
110 if (popcntA > popcntB)
112 return A.first <
B.first;
117 uint64_t UnitsFromResourceGroups = 0;
121 ID.HasPartiallyOverlappingGroups =
false;
123 for (
unsigned I = 0,
E = Worklist.
size();
I <
E; ++
I) {
124 ResourcePlusCycles &
A = Worklist[
I];
125 if (!
A.second.size()) {
131 ID.Resources.emplace_back(
A);
135 UsedResourceUnits |=
A.first;
139 if (UnitsFromResourceGroups & NormalizedMask)
140 ID.HasPartiallyOverlappingGroups =
true;
142 UnitsFromResourceGroups |= NormalizedMask;
143 UsedResourceGroups |= (
A.first ^ NormalizedMask);
146 for (
unsigned J =
I + 1; J <
E; ++J) {
147 ResourcePlusCycles &
B = Worklist[J];
148 if ((NormalizedMask &
B.first) == NormalizedMask) {
149 B.second.CS.subtract(
A.second.size() - SuperResources[
A.first]);
173 for (ResourcePlusCycles &RPC :
ID.Resources) {
179 RPC.second.setReserved();
180 RPC.second.NumUnits = MaxResourceUnits;
186 for (
const std::pair<uint64_t, unsigned> &SR : SuperResources) {
187 for (
unsigned I = 1,
E = NumProcResources;
I <
E; ++
I) {
193 if (Mask != SR.first && ((Mask & SR.first) == SR.first))
199 ID.UsedProcResUnits = UsedResourceUnits;
200 ID.UsedProcResGroups = UsedResourceGroups;
203 for (
const std::pair<uint64_t, ResourceUsage> &R :
ID.Resources)
205 <<
"Reserved=" << R.second.isReserved() <<
", "
206 <<
"#Units=" << R.second.NumUnits <<
", "
207 <<
"cy=" << R.second.size() <<
'\n';
210 uint64_t Current = BufferIDs & (-BufferIDs);
212 BufferIDs ^= Current;
214 dbgs() <<
"\t\t Used Units=" <<
format_hex(
ID.UsedProcResUnits, 16) <<
'\n';
217 dbgs() <<
"\t\tHasPartiallyOverlappingGroups="
218 <<
ID.HasPartiallyOverlappingGroups <<
'\n';
225 unsigned CallLatency) {
229 ID.MaxLatency = CallLatency;
236 ID.MaxLatency = Latency < 0 ? CallLatency : static_cast<unsigned>(
Latency);
242 unsigned NumExplicitDefs = MCDesc.
getNumDefs();
249 if (NumExplicitDefs) {
250 return make_error<InstructionError<MCInst>>(
251 "Expected more register operand definitions.", MCI);
258 std::string Message =
259 "expected a register operand for an optional definition. Instruction "
260 "has not been correctly analyzed.";
261 return make_error<InstructionError<MCInst>>(Message, MCI);
268void InstrBuilder::populateWrites(InstrDesc &
ID,
const MCInst &MCI,
269 unsigned SchedClassID) {
317 unsigned NumExplicitDefs = MCDesc.
getNumDefs();
320 unsigned TotalDefs = NumExplicitDefs + NumImplicitDefs;
325 ID.Writes.resize(TotalDefs + NumVariadicOps);
329 unsigned CurrentDef = 0;
332 for (; i < MCI.
getNumOperands() && CurrentDef < NumExplicitDefs; ++i) {
337 if (MCDesc.
operands()[CurrentDef].isOptionalDef()) {
338 OptionalDefIdx = CurrentDef++;
346 WriteDescriptor &
Write =
ID.Writes[CurrentDef];
348 if (CurrentDef < NumWriteLatencyEntries) {
349 const MCWriteLatencyEntry &WLE =
353 WLE.Cycles < 0 ?
ID.MaxLatency :
static_cast<unsigned>(WLE.Cycles);
354 Write.SClassOrWriteResourceID = WLE.WriteResourceID;
358 Write.SClassOrWriteResourceID = 0;
360 Write.IsOptionalDef =
false;
362 dbgs() <<
"\t\t[Def] OpIdx=" <<
Write.OpIndex
363 <<
", Latency=" <<
Write.Latency
364 <<
", WriteResourceID=" <<
Write.SClassOrWriteResourceID <<
'\n';
369 assert(CurrentDef == NumExplicitDefs &&
370 "Expected more register operand definitions.");
371 for (CurrentDef = 0; CurrentDef < NumImplicitDefs; ++CurrentDef) {
372 unsigned Index = NumExplicitDefs + CurrentDef;
374 Write.OpIndex = ~CurrentDef;
376 if (
Index < NumWriteLatencyEntries) {
377 const MCWriteLatencyEntry &WLE =
381 WLE.Cycles < 0 ?
ID.MaxLatency :
static_cast<unsigned>(WLE.Cycles);
382 Write.SClassOrWriteResourceID = WLE.WriteResourceID;
386 Write.SClassOrWriteResourceID = 0;
389 Write.IsOptionalDef =
false;
390 assert(
Write.RegisterID != 0 &&
"Expected a valid phys register!");
392 dbgs() <<
"\t\t[Def][I] OpIdx=" << ~Write.OpIndex
394 <<
", Latency=" <<
Write.Latency
395 <<
", WriteResourceID=" <<
Write.SClassOrWriteResourceID <<
'\n';
400 WriteDescriptor &
Write =
ID.Writes[NumExplicitDefs + NumImplicitDefs];
401 Write.OpIndex = OptionalDefIdx;
404 Write.SClassOrWriteResourceID = 0;
405 Write.IsOptionalDef =
true;
407 dbgs() <<
"\t\t[Def][O] OpIdx=" <<
Write.OpIndex
408 <<
", Latency=" <<
Write.Latency
409 <<
", WriteResourceID=" <<
Write.SClassOrWriteResourceID <<
'\n';
417 CurrentDef = NumExplicitDefs + NumImplicitDefs + MCDesc.
hasOptionalDef();
419 I < NumVariadicOps && !AssumeUsesOnly; ++
I, ++
OpIndex) {
426 WriteDescriptor &
Write =
ID.Writes[CurrentDef];
430 Write.SClassOrWriteResourceID = 0;
431 Write.IsOptionalDef =
false;
434 dbgs() <<
"\t\t[Def][V] OpIdx=" <<
Write.OpIndex
435 <<
", Latency=" <<
Write.Latency
436 <<
", WriteResourceID=" <<
Write.SClassOrWriteResourceID <<
'\n';
440 ID.Writes.resize(CurrentDef);
443void InstrBuilder::populateReads(InstrDesc &
ID,
const MCInst &MCI,
444 unsigned SchedClassID) {
445 const MCInstrDesc &MCDesc = MCII.
get(MCI.getOpcode());
446 unsigned NumExplicitUses = MCDesc.
getNumOperands() - MCDesc.getNumDefs();
447 unsigned NumImplicitUses = MCDesc.implicit_uses().size();
449 if (MCDesc.hasOptionalDef())
451 unsigned NumVariadicOps = MCI.getNumOperands() - MCDesc.getNumOperands();
452 unsigned TotalUses = NumExplicitUses + NumImplicitUses + NumVariadicOps;
453 ID.Reads.resize(TotalUses);
454 unsigned CurrentUse = 0;
455 for (
unsigned I = 0,
OpIndex = MCDesc.getNumDefs();
I < NumExplicitUses;
457 const MCOperand &
Op = MCI.getOperand(
OpIndex);
463 ReadDescriptor &
Read =
ID.Reads[CurrentUse];
466 Read.SchedClassID = SchedClassID;
469 <<
", UseIndex=" <<
Read.UseIndex <<
'\n');
474 for (
unsigned I = 0;
I < NumImplicitUses; ++
I) {
475 ReadDescriptor &
Read =
ID.Reads[CurrentUse +
I];
477 Read.UseIndex = NumExplicitUses +
I;
478 Read.RegisterID = MCDesc.implicit_uses()[
I];
481 Read.SchedClassID = SchedClassID;
483 <<
", UseIndex=" <<
Read.UseIndex <<
", RegisterID="
487 CurrentUse += NumImplicitUses;
489 bool AssumeDefsOnly = MCDesc.variadicOpsAreDefs();
490 for (
unsigned I = 0,
OpIndex = MCDesc.getNumOperands();
491 I < NumVariadicOps && !AssumeDefsOnly; ++
I, ++
OpIndex) {
492 const MCOperand &
Op = MCI.getOperand(
OpIndex);
496 ReadDescriptor &
Read =
ID.Reads[CurrentUse];
498 Read.UseIndex = NumExplicitUses + NumImplicitUses +
I;
499 Read.SchedClassID = SchedClassID;
502 <<
", UseIndex=" <<
Read.UseIndex <<
'\n');
505 ID.Reads.resize(CurrentUse);
523 return InstructionHash;
526Error InstrBuilder::verifyInstrDesc(
const InstrDesc &
ID,
527 const MCInst &MCI)
const {
528 if (
ID.NumMicroOps != 0)
531 bool UsesBuffers =
ID.UsedBuffers;
532 bool UsesResources = !
ID.Resources.empty();
533 if (!UsesBuffers && !UsesResources)
538 StringRef Message =
"found an inconsistent instruction that decodes to zero "
539 "opcodes and that consumes scheduler resources.";
540 return make_error<InstructionError<MCInst>>(std::string(Message), MCI);
543Expected<unsigned> InstrBuilder::getVariantSchedClassID(
const MCInst &MCI,
544 unsigned SchedClassID) {
547 while (SchedClassID && SM.getSchedClassDesc(SchedClassID)->isVariant())
552 return make_error<InstructionError<MCInst>>(
553 "unable to resolve scheduling class for write variant.", MCI);
559Expected<const InstrDesc &>
560InstrBuilder::createInstrDescImpl(
const MCInst &MCI,
561 const SmallVector<Instrument *> &IVec) {
563 "Itineraries are not yet supported!");
566 unsigned short Opcode = MCI.getOpcode();
567 const MCInstrDesc &MCDesc = MCII.
get(Opcode);
573 bool IsVariant = SM.getSchedClassDesc(SchedClassID)->isVariant();
577 Expected<unsigned> VariantSchedClassIDOrErr =
578 getVariantSchedClassID(MCI, SchedClassID);
579 if (!VariantSchedClassIDOrErr) {
580 return VariantSchedClassIDOrErr.takeError();
583 SchedClassID = *VariantSchedClassIDOrErr;
587 const MCSchedClassDesc &SCDesc = *SM.getSchedClassDesc(SchedClassID);
589 return make_error<InstructionError<MCInst>>(
590 "found an unsupported instruction in the input assembly sequence", MCI);
594 LLVM_DEBUG(
dbgs() <<
"\t\tSchedClassID=" << SchedClassID <<
'\n');
598 std::unique_ptr<InstrDesc>
ID = std::make_unique<InstrDesc>();
599 ID->NumMicroOps = SCDesc.NumMicroOps;
600 ID->SchedClassID = SchedClassID;
602 if (MCDesc.isCall() && FirstCallInst) {
606 <<
"Assume a latency of " << CallLatency <<
"cy.\n";
607 FirstCallInst =
false;
610 if (MCDesc.isReturn() && FirstReturnInst) {
612 <<
" assembly sequence.\n";
614 FirstReturnInst =
false;
621 return std::move(Err);
623 populateWrites(*
ID, MCI, SchedClassID);
624 populateReads(*
ID, MCI, SchedClassID);
630 if (Error Err = verifyInstrDesc(*
ID, MCI))
631 return std::move(Err);
634 bool IsVariadic = MCDesc.isVariadic();
635 if ((
ID->IsRecyclable = !IsVariadic && !IsVariant)) {
636 auto DKey = std::make_pair(MCI.getOpcode(), SchedClassID);
637 Descriptors[DKey] = std::move(
ID);
638 return *Descriptors[DKey];
641 auto VDKey = std::make_pair(
hashMCInst(MCI), SchedClassID);
643 !VariantDescriptors.contains(VDKey) &&
644 "Expected VariantDescriptors to not already have a value for this key.");
645 VariantDescriptors[VDKey] = std::move(
ID);
646 return *VariantDescriptors[VDKey];
649Expected<const InstrDesc &>
650InstrBuilder::getOrCreateInstrDesc(
const MCInst &MCI,
651 const SmallVector<Instrument *> &IVec) {
655 auto DKey = std::make_pair(MCI.getOpcode(), SchedClassID);
656 if (Descriptors.find_as(DKey) != Descriptors.end())
657 return *Descriptors[DKey];
659 Expected<unsigned> VariantSchedClassIDOrErr =
660 getVariantSchedClassID(MCI, SchedClassID);
661 if (!VariantSchedClassIDOrErr) {
662 return VariantSchedClassIDOrErr.takeError();
665 SchedClassID = *VariantSchedClassIDOrErr;
667 auto VDKey = std::make_pair(
hashMCInst(MCI), SchedClassID);
668 if (VariantDescriptors.contains(VDKey))
669 return *VariantDescriptors[VDKey];
671 return createInstrDescImpl(MCI, IVec);
674STATISTIC(NumVariantInst,
"Number of MCInsts that doesn't have static Desc");
684 std::unique_ptr<Instruction> CreatedIS;
685 bool IsInstRecycled =
false;
690 if (
D.IsRecyclable && InstRecycleCB) {
691 if (
auto *
I = InstRecycleCB(
D)) {
694 IsInstRecycled =
true;
697 if (!IsInstRecycled) {
698 CreatedIS = std::make_unique<Instruction>(
D, MCI.
getOpcode());
699 NewIS = CreatedIS.get();
716 bool IsZeroIdiom =
false;
717 bool IsDepBreaking =
false;
720 IsZeroIdiom = MCIA->
isZeroIdiom(MCI, Mask, ProcID);
749 if (IsInstRecycled && Idx < NewIS->getUses().
size()) {
753 NewIS->
getUses().emplace_back(RD, RegID);
770 if (Mask.getBitWidth() > RD.
UseIndex) {
778 if (IsInstRecycled && Idx < NewIS->getUses().
size())
782 if (
D.Writes.empty()) {
784 return llvm::make_error<RecycledInstErr>(NewIS);
786 return std::move(CreatedIS);
791 APInt WriteMask(
D.Writes.size(), 0);
799 unsigned WriteIndex = 0;
811 assert(RegID &&
"Expected a valid register ID!");
812 if (IsInstRecycled && Idx < NewIS->getDefs().
size()) {
815 WriteMask[WriteIndex],
818 NewIS->
getDefs().emplace_back(WD, RegID,
819 WriteMask[WriteIndex],
825 if (IsInstRecycled && Idx < NewIS->getDefs().
size())
829 return llvm::make_error<RecycledInstErr>(NewIS);
831 return std::move(CreatedIS);
unsigned const MachineRegisterInfo * MRI
This file implements a class to represent arbitrary precision integral constant values and operations...
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
This file defines the DenseMap class.
A builder class for instructions that are statically analyzed by llvm-mca.
while(!ToSimplify.empty())
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Class for arbitrary precision integers.
uint64_t getZExtValue() const
Get zero extended value.
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
This class represents an Operation in the Expression.
Subclass of Error for the sole purpose of identifying the success path in the type system.
Lightweight error class with error context and mandatory checking.
Tagged union holding either a T or a Error.
Error takeError()
Take ownership of the stored error.
Instances of this class represent a single low-level machine instruction.
unsigned getNumOperands() const
unsigned getFlags() const
unsigned getOpcode() const
const MCOperand & getOperand(unsigned i) const
virtual bool isOptimizableRegisterMove(const MCInst &MI, unsigned CPUID) const
Returns true if MI is a candidate for move elimination.
virtual bool isDependencyBreaking(const MCInst &MI, APInt &Mask, unsigned CPUID) const
Returns true if MI is a dependency breaking instruction for the subtarget associated with CPUID .
virtual bool isZeroIdiom(const MCInst &MI, APInt &Mask, unsigned CPUID) const
Returns true if MI is a dependency breaking zero-idiom for the given subtarget.
virtual bool clearsSuperRegisters(const MCRegisterInfo &MRI, const MCInst &Inst, APInt &Writes) const
Returns true if at least one of the register writes performed by.
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
ArrayRef< MCOperandInfo > operands() const
bool mayStore() const
Return true if this instruction could possibly modify memory.
bool mayLoad() const
Return true if this instruction could possibly read memory.
bool hasOptionalDef() const
Set if this instruction has an optional definition, e.g.
unsigned getNumDefs() const
Return the number of MachineOperands that are register definitions.
bool variadicOpsAreDefs() const
Return true if variadic operands of this instruction are definitions.
ArrayRef< MCPhysReg > implicit_defs() const
Return a list of registers that are potentially written by any instance of this machine instruction.
bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by other flags.
bool isCall() const
Return true if the instruction is a call.
Interface to description of machine instruction set.
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
StringRef getName(unsigned Opcode) const
Returns the name for the instructions with the given opcode.
Instances of this class represent operands of the MCInst class.
unsigned getReg() const
Returns the register number.
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
const char * getName(MCRegister RegNo) const
Return the human-readable symbolic target-specific name for the specified physical register.
bool isConstant(MCRegister RegNo) const
Returns true if the given register is constant.
Generic base class for all target subtargets.
virtual unsigned resolveVariantSchedClass(unsigned SchedClass, const MCInst *MI, const MCInstrInfo *MCII, unsigned CPUID) const
Resolve a variant scheduling class for the given MCInst and CPU.
const MCWriteLatencyEntry * getWriteLatencyEntry(const MCSchedClassDesc *SC, unsigned DefIdx) const
const MCWriteProcResEntry * getWriteProcResBegin(const MCSchedClassDesc *SC) const
Return an iterator at the first process resource consumed by the given scheduling class.
const MCSchedModel & getSchedModel() const
Get the machine model for this subtarget's CPU.
reference emplace_back(ArgTypes &&... Args)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
static raw_ostream & warning()
Convenience method for printing "warning: " to stderr.
static raw_ostream & note()
Convenience method for printing "note: " to stderr.
An opaque object representing a hash code.
Expected< std::unique_ptr< Instruction > > createInstruction(const MCInst &MCI, const SmallVector< Instrument * > &IVec)
void setEndGroup(bool newVal)
void setRetireOOO(bool newVal)
SmallVectorImpl< WriteState > & getDefs()
void setBeginGroup(bool newVal)
SmallVectorImpl< ReadState > & getUses()
void setHasSideEffects(bool newVal)
void setMayStore(bool newVal)
void setOptimizableMove()
void setMayLoad(bool newVal)
An instruction propagated through the simulated instruction pipeline.
This class allows targets to optionally customize the logic that resolves scheduling class IDs.
virtual unsigned getSchedClassID(const MCInstrInfo &MCII, const MCInst &MCI, const SmallVector< Instrument * > &IVec) const
Given an MCInst and a vector of Instrument, a target can return a SchedClassID.
Tracks register operand latency in cycles.
void setIndependentFromDef()
Tracks uses of a register definition (e.g.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
hash_code hashMCInst(const MCInst &MCI)
static void initializeUsedResources(InstrDesc &ID, const MCSchedClassDesc &SCDesc, const MCSubtargetInfo &STI, ArrayRef< uint64_t > ProcResourceMasks)
hash_code hashMCOperand(const MCOperand &MCO)
static void computeMaxLatency(InstrDesc &ID, const MCInstrDesc &MCDesc, const MCSchedClassDesc &SCDesc, const MCSubtargetInfo &STI, unsigned CallLatency)
void computeProcResourceMasks(const MCSchedModel &SM, MutableArrayRef< uint64_t > Masks)
Populates vector Masks with processor resource masks.
unsigned getResourceStateIndex(uint64_t Mask)
static Error verifyOperands(const MCInstrDesc &MCDesc, const MCInst &MCI)
This is an optimization pass for GlobalISel generic memory operations.
int popcount(T Value) noexcept
Count the number of set bits in a value.
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
void sort(IteratorTy Start, IteratorTy End)
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FormattedNumber format_hex(uint64_t N, unsigned Width, bool Upper=false)
format_hex - Output N as a fixed width hexadecimal.
DWARFExpression::Operation Op
hash_code hash_combine(const Ts &...args)
Combine values into a single hash_code.
T bit_floor(T Value)
Returns the largest integral power of two no greater than Value if Value is nonzero.
Define a kind of processor resource that will be modeled by the scheduler.
Summarize the scheduling resources required for an instruction of a particular scheduling class.
static const unsigned short InvalidNumMicroOps
uint16_t NumWriteLatencyEntries
uint16_t NumWriteProcResEntries
Machine model for scheduling, bundling, and heuristics.
const MCSchedClassDesc * getSchedClassDesc(unsigned SchedClassIdx) const
unsigned getProcessorID() const
unsigned getNumProcResourceKinds() const
bool hasInstrSchedModel() const
Does this machine model include instruction-level scheduling.
static int computeInstrLatency(const MCSubtargetInfo &STI, const MCSchedClassDesc &SCDesc)
Returns the latency value for the scheduling class.
const MCProcResourceDesc * getProcResource(unsigned ProcResourceIdx) const
Identify one of the processor resource kinds consumed by a particular scheduling class for the specif...
uint16_t ReleaseAtCycle
Cycle at which the resource will be released by an instruction, relatively to the cycle in which the ...
An instruction descriptor.
A register read descriptor.
bool isImplicitRead() const
Helper used by class InstrDesc to describe how hardware resources are used.
A register write descriptor.
bool isImplicitWrite() const