123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418 |
- //=- llvm/CodeGen/DFAPacketizer.cpp - DFA Packetizer for VLIW -*- C++ -*-=====//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- // This class implements a deterministic finite automaton (DFA) based
- // packetizing mechanism for VLIW architectures. It provides APIs to
- // determine whether there exists a legal mapping of instructions to
- // functional unit assignments in a packet. The DFA is auto-generated from
- // the target's Schedule.td file.
- //
- // A DFA consists of 3 major elements: states, inputs, and transitions. For
- // the packetizing mechanism, the input is the set of instruction classes for
- // a target. The state models all possible combinations of functional unit
- // consumption for a given set of instructions in a packet. A transition
- // models the addition of an instruction to a packet. In the DFA constructed
- // by this class, if an instruction can be added to a packet, then a valid
- // transition exists from the corresponding state. Invalid transitions
- // indicate that the instruction cannot be added to the current packet.
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/CodeGen/DFAPacketizer.h"
- #include "llvm/ADT/StringExtras.h"
- #include "llvm/CodeGen/MachineFunction.h"
- #include "llvm/CodeGen/MachineInstr.h"
- #include "llvm/CodeGen/MachineInstrBundle.h"
- #include "llvm/CodeGen/ScheduleDAG.h"
- #include "llvm/CodeGen/ScheduleDAGInstrs.h"
- #include "llvm/CodeGen/TargetInstrInfo.h"
- #include "llvm/CodeGen/TargetSubtargetInfo.h"
- #include "llvm/MC/MCInstrDesc.h"
- #include "llvm/MC/MCInstrItineraries.h"
- #include "llvm/Support/CommandLine.h"
- #include "llvm/Support/Debug.h"
- #include "llvm/Support/raw_ostream.h"
- #include <algorithm>
- #include <cassert>
- #include <iterator>
- #include <memory>
- #include <vector>
- using namespace llvm;
- #define DEBUG_TYPE "packets"
- static cl::opt<unsigned> InstrLimit("dfa-instr-limit", cl::Hidden,
- cl::init(0), cl::desc("If present, stops packetizing after N instructions"));
- static unsigned InstrCount = 0;
- // --------------------------------------------------------------------
- // Definitions shared between DFAPacketizer.cpp and DFAPacketizerEmitter.cpp
- static DFAInput addDFAFuncUnits(DFAInput Inp, unsigned FuncUnits) {
- return (Inp << DFA_MAX_RESOURCES) | FuncUnits;
- }
- /// Return the DFAInput for an instruction class input vector.
- /// This function is used in both DFAPacketizer.cpp and in
- /// DFAPacketizerEmitter.cpp.
- static DFAInput getDFAInsnInput(const std::vector<unsigned> &InsnClass) {
- DFAInput InsnInput = 0;
- assert((InsnClass.size() <= DFA_MAX_RESTERMS) &&
- "Exceeded maximum number of DFA terms");
- for (auto U : InsnClass)
- InsnInput = addDFAFuncUnits(InsnInput, U);
- return InsnInput;
- }
- // --------------------------------------------------------------------
- DFAPacketizer::DFAPacketizer(const InstrItineraryData *I,
- const DFAStateInput (*SIT)[2], const unsigned *SET,
- const unsigned (*RTT)[2],
- const unsigned *RTET)
- : InstrItins(I), DFAStateInputTable(SIT), DFAStateEntryTable(SET),
- DFAResourceTransitionTable(RTT), DFAResourceTransitionEntryTable(RTET) {
- // Make sure DFA types are large enough for the number of terms & resources.
- static_assert((DFA_MAX_RESTERMS * DFA_MAX_RESOURCES) <=
- (8 * sizeof(DFAInput)),
- "(DFA_MAX_RESTERMS * DFA_MAX_RESOURCES) too big for DFAInput");
- static_assert(
- (DFA_MAX_RESTERMS * DFA_MAX_RESOURCES) <= (8 * sizeof(DFAStateInput)),
- "(DFA_MAX_RESTERMS * DFA_MAX_RESOURCES) too big for DFAStateInput");
- clearResources();
- }
- // Read the DFA transition table and update CachedTable.
- //
- // Format of the transition tables:
- // DFAStateInputTable[][2] = pairs of <Input, Transition> for all valid
- // transitions
- // DFAStateEntryTable[i] = Index of the first entry in DFAStateInputTable
- // for the ith state
- //
- void DFAPacketizer::ReadTable(unsigned int state) {
- unsigned ThisStateIdx = DFAStateEntryTable[state];
- unsigned NextStateIdxInTable = DFAStateEntryTable[state + 1];
- // Early exit in case CachedTable has already contains this
- // state's transitions.
- if (CachedTable.count(UnsignPair(state, DFAStateInputTable[ThisStateIdx][0])))
- return;
- for (unsigned TransitionIdx = ThisStateIdx;
- TransitionIdx < NextStateIdxInTable; TransitionIdx++) {
- auto TransitionPair =
- UnsignPair(state, DFAStateInputTable[TransitionIdx][0]);
- CachedTable[TransitionPair] = DFAStateInputTable[TransitionIdx][1];
- if (TrackResources) {
- unsigned I = DFAResourceTransitionEntryTable[TransitionIdx];
- unsigned E = DFAResourceTransitionEntryTable[TransitionIdx + 1];
- CachedResourceTransitions[TransitionPair] = makeArrayRef(
- &DFAResourceTransitionTable[I], &DFAResourceTransitionTable[E]);
- }
- }
- }
- // Return the DFAInput for an instruction class.
- DFAInput DFAPacketizer::getInsnInput(unsigned InsnClass) {
- // Note: this logic must match that in DFAPacketizerDefs.h for input vectors.
- DFAInput InsnInput = 0;
- unsigned i = 0;
- (void)i;
- for (const InstrStage *IS = InstrItins->beginStage(InsnClass),
- *IE = InstrItins->endStage(InsnClass); IS != IE; ++IS) {
- InsnInput = addDFAFuncUnits(InsnInput, IS->getUnits());
- assert((i++ < DFA_MAX_RESTERMS) && "Exceeded maximum number of DFA inputs");
- }
- return InsnInput;
- }
- // Return the DFAInput for an instruction class input vector.
- DFAInput DFAPacketizer::getInsnInput(const std::vector<unsigned> &InsnClass) {
- return getDFAInsnInput(InsnClass);
- }
- // Check if the resources occupied by a MCInstrDesc are available in the
- // current state.
- bool DFAPacketizer::canReserveResources(const MCInstrDesc *MID) {
- unsigned InsnClass = MID->getSchedClass();
- DFAInput InsnInput = getInsnInput(InsnClass);
- UnsignPair StateTrans = UnsignPair(CurrentState, InsnInput);
- ReadTable(CurrentState);
- return CachedTable.count(StateTrans) != 0;
- }
- // Reserve the resources occupied by a MCInstrDesc and change the current
- // state to reflect that change.
- void DFAPacketizer::reserveResources(const MCInstrDesc *MID) {
- unsigned InsnClass = MID->getSchedClass();
- DFAInput InsnInput = getInsnInput(InsnClass);
- UnsignPair StateTrans = UnsignPair(CurrentState, InsnInput);
- ReadTable(CurrentState);
- if (TrackResources) {
- DenseMap<unsigned, SmallVector<unsigned, 8>> NewResourceStates;
- for (const auto &KV : CachedResourceTransitions[StateTrans]) {
- assert(ResourceStates.count(KV[0]));
- NewResourceStates[KV[1]] = ResourceStates[KV[0]];
- NewResourceStates[KV[1]].push_back(KV[1]);
- }
- ResourceStates = NewResourceStates;
- }
- assert(CachedTable.count(StateTrans) != 0);
- CurrentState = CachedTable[StateTrans];
- }
- // Check if the resources occupied by a machine instruction are available
- // in the current state.
- bool DFAPacketizer::canReserveResources(MachineInstr &MI) {
- const MCInstrDesc &MID = MI.getDesc();
- return canReserveResources(&MID);
- }
- // Reserve the resources occupied by a machine instruction and change the
- // current state to reflect that change.
- void DFAPacketizer::reserveResources(MachineInstr &MI) {
- const MCInstrDesc &MID = MI.getDesc();
- reserveResources(&MID);
- }
- unsigned DFAPacketizer::getUsedResources(unsigned InstIdx) {
- assert(TrackResources && "getUsedResources requires resource tracking!");
- // Assert that there is at least one example of a valid bundle format.
- assert(!ResourceStates.empty() && "Invalid bundle!");
- SmallVectorImpl<unsigned> &RS = ResourceStates.begin()->second;
- // RS stores the cumulative resources used up to and including the I'th
- // instruction. The 0th instruction is the base case.
- if (InstIdx == 0)
- return RS[0];
- // Return the difference between the cumulative resources used by InstIdx and
- // its predecessor.
- return RS[InstIdx] ^ RS[InstIdx - 1];
- }
- namespace llvm {
- // This class extends ScheduleDAGInstrs and overrides the schedule method
- // to build the dependence graph.
- class DefaultVLIWScheduler : public ScheduleDAGInstrs {
- private:
- AliasAnalysis *AA;
- /// Ordered list of DAG postprocessing steps.
- std::vector<std::unique_ptr<ScheduleDAGMutation>> Mutations;
- public:
- DefaultVLIWScheduler(MachineFunction &MF, MachineLoopInfo &MLI,
- AliasAnalysis *AA);
- // Actual scheduling work.
- void schedule() override;
- /// DefaultVLIWScheduler takes ownership of the Mutation object.
- void addMutation(std::unique_ptr<ScheduleDAGMutation> Mutation) {
- Mutations.push_back(std::move(Mutation));
- }
- protected:
- void postprocessDAG();
- };
- } // end namespace llvm
- DefaultVLIWScheduler::DefaultVLIWScheduler(MachineFunction &MF,
- MachineLoopInfo &MLI,
- AliasAnalysis *AA)
- : ScheduleDAGInstrs(MF, &MLI), AA(AA) {
- CanHandleTerminators = true;
- }
- /// Apply each ScheduleDAGMutation step in order.
- void DefaultVLIWScheduler::postprocessDAG() {
- for (auto &M : Mutations)
- M->apply(this);
- }
- void DefaultVLIWScheduler::schedule() {
- // Build the scheduling graph.
- buildSchedGraph(AA);
- postprocessDAG();
- }
- VLIWPacketizerList::VLIWPacketizerList(MachineFunction &mf,
- MachineLoopInfo &mli, AliasAnalysis *aa)
- : MF(mf), TII(mf.getSubtarget().getInstrInfo()), AA(aa) {
- ResourceTracker = TII->CreateTargetScheduleState(MF.getSubtarget());
- ResourceTracker->setTrackResources(true);
- VLIWScheduler = new DefaultVLIWScheduler(MF, mli, AA);
- }
- VLIWPacketizerList::~VLIWPacketizerList() {
- delete VLIWScheduler;
- delete ResourceTracker;
- }
- // End the current packet, bundle packet instructions and reset DFA state.
- void VLIWPacketizerList::endPacket(MachineBasicBlock *MBB,
- MachineBasicBlock::iterator MI) {
- LLVM_DEBUG({
- if (!CurrentPacketMIs.empty()) {
- dbgs() << "Finalizing packet:\n";
- unsigned Idx = 0;
- for (MachineInstr *MI : CurrentPacketMIs) {
- unsigned R = ResourceTracker->getUsedResources(Idx++);
- dbgs() << " * [res:0x" << utohexstr(R) << "] " << *MI;
- }
- }
- });
- if (CurrentPacketMIs.size() > 1) {
- MachineInstr &MIFirst = *CurrentPacketMIs.front();
- finalizeBundle(*MBB, MIFirst.getIterator(), MI.getInstrIterator());
- }
- CurrentPacketMIs.clear();
- ResourceTracker->clearResources();
- LLVM_DEBUG(dbgs() << "End packet\n");
- }
- // Bundle machine instructions into packets.
- void VLIWPacketizerList::PacketizeMIs(MachineBasicBlock *MBB,
- MachineBasicBlock::iterator BeginItr,
- MachineBasicBlock::iterator EndItr) {
- assert(VLIWScheduler && "VLIW Scheduler is not initialized!");
- VLIWScheduler->startBlock(MBB);
- VLIWScheduler->enterRegion(MBB, BeginItr, EndItr,
- std::distance(BeginItr, EndItr));
- VLIWScheduler->schedule();
- LLVM_DEBUG({
- dbgs() << "Scheduling DAG of the packetize region\n";
- VLIWScheduler->dump();
- });
- // Generate MI -> SU map.
- MIToSUnit.clear();
- for (SUnit &SU : VLIWScheduler->SUnits)
- MIToSUnit[SU.getInstr()] = &SU;
- bool LimitPresent = InstrLimit.getPosition();
- // The main packetizer loop.
- for (; BeginItr != EndItr; ++BeginItr) {
- if (LimitPresent) {
- if (InstrCount >= InstrLimit) {
- EndItr = BeginItr;
- break;
- }
- InstrCount++;
- }
- MachineInstr &MI = *BeginItr;
- initPacketizerState();
- // End the current packet if needed.
- if (isSoloInstruction(MI)) {
- endPacket(MBB, MI);
- continue;
- }
- // Ignore pseudo instructions.
- if (ignorePseudoInstruction(MI, MBB))
- continue;
- SUnit *SUI = MIToSUnit[&MI];
- assert(SUI && "Missing SUnit Info!");
- // Ask DFA if machine resource is available for MI.
- LLVM_DEBUG(dbgs() << "Checking resources for adding MI to packet " << MI);
- bool ResourceAvail = ResourceTracker->canReserveResources(MI);
- LLVM_DEBUG({
- if (ResourceAvail)
- dbgs() << " Resources are available for adding MI to packet\n";
- else
- dbgs() << " Resources NOT available\n";
- });
- if (ResourceAvail && shouldAddToPacket(MI)) {
- // Dependency check for MI with instructions in CurrentPacketMIs.
- for (auto MJ : CurrentPacketMIs) {
- SUnit *SUJ = MIToSUnit[MJ];
- assert(SUJ && "Missing SUnit Info!");
- LLVM_DEBUG(dbgs() << " Checking against MJ " << *MJ);
- // Is it legal to packetize SUI and SUJ together.
- if (!isLegalToPacketizeTogether(SUI, SUJ)) {
- LLVM_DEBUG(dbgs() << " Not legal to add MI, try to prune\n");
- // Allow packetization if dependency can be pruned.
- if (!isLegalToPruneDependencies(SUI, SUJ)) {
- // End the packet if dependency cannot be pruned.
- LLVM_DEBUG(dbgs()
- << " Could not prune dependencies for adding MI\n");
- endPacket(MBB, MI);
- break;
- }
- LLVM_DEBUG(dbgs() << " Pruned dependence for adding MI\n");
- }
- }
- } else {
- LLVM_DEBUG(if (ResourceAvail) dbgs()
- << "Resources are available, but instruction should not be "
- "added to packet\n "
- << MI);
- // End the packet if resource is not available, or if the instruction
- // shoud not be added to the current packet.
- endPacket(MBB, MI);
- }
- // Add MI to the current packet.
- LLVM_DEBUG(dbgs() << "* Adding MI to packet " << MI << '\n');
- BeginItr = addToPacket(MI);
- } // For all instructions in the packetization range.
- // End any packet left behind.
- endPacket(MBB, EndItr);
- VLIWScheduler->exitRegion();
- VLIWScheduler->finishBlock();
- }
- bool VLIWPacketizerList::alias(const MachineMemOperand &Op1,
- const MachineMemOperand &Op2,
- bool UseTBAA) const {
- if (!Op1.getValue() || !Op2.getValue())
- return true;
- int64_t MinOffset = std::min(Op1.getOffset(), Op2.getOffset());
- int64_t Overlapa = Op1.getSize() + Op1.getOffset() - MinOffset;
- int64_t Overlapb = Op2.getSize() + Op2.getOffset() - MinOffset;
- AliasResult AAResult =
- AA->alias(MemoryLocation(Op1.getValue(), Overlapa,
- UseTBAA ? Op1.getAAInfo() : AAMDNodes()),
- MemoryLocation(Op2.getValue(), Overlapb,
- UseTBAA ? Op2.getAAInfo() : AAMDNodes()));
- return AAResult != NoAlias;
- }
- bool VLIWPacketizerList::alias(const MachineInstr &MI1,
- const MachineInstr &MI2,
- bool UseTBAA) const {
- if (MI1.memoperands_empty() || MI2.memoperands_empty())
- return true;
- for (const MachineMemOperand *Op1 : MI1.memoperands())
- for (const MachineMemOperand *Op2 : MI2.memoperands())
- if (alias(*Op1, *Op2, UseTBAA))
- return true;
- return false;
- }
- // Add a DAG mutation object to the ordered list.
- void VLIWPacketizerList::addMutation(
- std::unique_ptr<ScheduleDAGMutation> Mutation) {
- VLIWScheduler->addMutation(std::move(Mutation));
- }
|