//=- llvm/CodeGen/DFAPacketizer.cpp - DFA Packetizer for VLIW -*- C++ -*-=====// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // This class implements a deterministic finite automaton (DFA) based // packetizing mechanism for VLIW architectures. It provides APIs to // determine whether there exists a legal mapping of instructions to // functional unit assignments in a packet. The DFA is auto-generated from // the target's Schedule.td file. // // A DFA consists of 3 major elements: states, inputs, and transitions. For // the packetizing mechanism, the input is the set of instruction classes for // a target. The state models all possible combinations of functional unit // consumption for a given set of instructions in a packet. A transition // models the addition of an instruction to a packet. In the DFA constructed // by this class, if an instruction can be added to a packet, then a valid // transition exists from the corresponding state. Invalid transitions // indicate that the instruction cannot be added to the current packet. // //===----------------------------------------------------------------------===// #include "llvm/CodeGen/DFAPacketizer.h" #include "llvm/ADT/StringExtras.h" #include "llvm/Analysis/AliasAnalysis.h" #include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/MachineInstr.h" #include "llvm/CodeGen/MachineInstrBundle.h" #include "llvm/CodeGen/ScheduleDAG.h" #include "llvm/CodeGen/TargetInstrInfo.h" #include "llvm/CodeGen/TargetSubtargetInfo.h" #include "llvm/MC/MCInstrDesc.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" #include "llvm/Support/raw_ostream.h" #include #include #include #include #include using namespace llvm; #define DEBUG_TYPE "packets" static cl::opt InstrLimit("dfa-instr-limit", cl::Hidden, cl::init(0), cl::desc("If present, stops packetizing after N instructions")); static unsigned InstrCount = 0; // Check if the resources occupied by a MCInstrDesc are available in the // current state. bool DFAPacketizer::canReserveResources(const MCInstrDesc *MID) { unsigned Action = ItinActions[MID->getSchedClass()]; if (MID->getSchedClass() == 0 || Action == 0) return false; return A.canAdd(Action); } // Reserve the resources occupied by a MCInstrDesc and change the current // state to reflect that change. void DFAPacketizer::reserveResources(const MCInstrDesc *MID) { unsigned Action = ItinActions[MID->getSchedClass()]; if (MID->getSchedClass() == 0 || Action == 0) return; A.add(Action); } // Check if the resources occupied by a machine instruction are available // in the current state. bool DFAPacketizer::canReserveResources(MachineInstr &MI) { const MCInstrDesc &MID = MI.getDesc(); return canReserveResources(&MID); } // Reserve the resources occupied by a machine instruction and change the // current state to reflect that change. void DFAPacketizer::reserveResources(MachineInstr &MI) { const MCInstrDesc &MID = MI.getDesc(); reserveResources(&MID); } unsigned DFAPacketizer::getUsedResources(unsigned InstIdx) { ArrayRef NfaPaths = A.getNfaPaths(); assert(!NfaPaths.empty() && "Invalid bundle!"); const NfaPath &RS = NfaPaths.front(); // RS stores the cumulative resources used up to and including the I'th // instruction. The 0th instruction is the base case. if (InstIdx == 0) return RS[0]; // Return the difference between the cumulative resources used by InstIdx and // its predecessor. return RS[InstIdx] ^ RS[InstIdx - 1]; } DefaultVLIWScheduler::DefaultVLIWScheduler(MachineFunction &MF, MachineLoopInfo &MLI, AAResults *AA) : ScheduleDAGInstrs(MF, &MLI), AA(AA) { CanHandleTerminators = true; } /// Apply each ScheduleDAGMutation step in order. void DefaultVLIWScheduler::postProcessDAG() { for (auto &M : Mutations) M->apply(this); } void DefaultVLIWScheduler::schedule() { // Build the scheduling graph. buildSchedGraph(AA); postProcessDAG(); } VLIWPacketizerList::VLIWPacketizerList(MachineFunction &mf, MachineLoopInfo &mli, AAResults *aa) : MF(mf), TII(mf.getSubtarget().getInstrInfo()), AA(aa) { ResourceTracker = TII->CreateTargetScheduleState(MF.getSubtarget()); ResourceTracker->setTrackResources(true); VLIWScheduler = new DefaultVLIWScheduler(MF, mli, AA); } VLIWPacketizerList::~VLIWPacketizerList() { delete VLIWScheduler; delete ResourceTracker; } // End the current packet, bundle packet instructions and reset DFA state. void VLIWPacketizerList::endPacket(MachineBasicBlock *MBB, MachineBasicBlock::iterator MI) { LLVM_DEBUG({ if (!CurrentPacketMIs.empty()) { dbgs() << "Finalizing packet:\n"; unsigned Idx = 0; for (MachineInstr *MI : CurrentPacketMIs) { unsigned R = ResourceTracker->getUsedResources(Idx++); dbgs() << " * [res:0x" << utohexstr(R) << "] " << *MI; } } }); if (CurrentPacketMIs.size() > 1) { MachineInstr &MIFirst = *CurrentPacketMIs.front(); finalizeBundle(*MBB, MIFirst.getIterator(), MI.getInstrIterator()); } CurrentPacketMIs.clear(); ResourceTracker->clearResources(); LLVM_DEBUG(dbgs() << "End packet\n"); } // Bundle machine instructions into packets. void VLIWPacketizerList::PacketizeMIs(MachineBasicBlock *MBB, MachineBasicBlock::iterator BeginItr, MachineBasicBlock::iterator EndItr) { assert(VLIWScheduler && "VLIW Scheduler is not initialized!"); VLIWScheduler->startBlock(MBB); VLIWScheduler->enterRegion(MBB, BeginItr, EndItr, std::distance(BeginItr, EndItr)); VLIWScheduler->schedule(); LLVM_DEBUG({ dbgs() << "Scheduling DAG of the packetize region\n"; VLIWScheduler->dump(); }); // Generate MI -> SU map. MIToSUnit.clear(); for (SUnit &SU : VLIWScheduler->SUnits) MIToSUnit[SU.getInstr()] = &SU; bool LimitPresent = InstrLimit.getPosition(); // The main packetizer loop. for (; BeginItr != EndItr; ++BeginItr) { if (LimitPresent) { if (InstrCount >= InstrLimit) { EndItr = BeginItr; break; } InstrCount++; } MachineInstr &MI = *BeginItr; initPacketizerState(); // End the current packet if needed. if (isSoloInstruction(MI)) { endPacket(MBB, MI); continue; } // Ignore pseudo instructions. if (ignorePseudoInstruction(MI, MBB)) continue; SUnit *SUI = MIToSUnit[&MI]; assert(SUI && "Missing SUnit Info!"); // Ask DFA if machine resource is available for MI. LLVM_DEBUG(dbgs() << "Checking resources for adding MI to packet " << MI); bool ResourceAvail = ResourceTracker->canReserveResources(MI); LLVM_DEBUG({ if (ResourceAvail) dbgs() << " Resources are available for adding MI to packet\n"; else dbgs() << " Resources NOT available\n"; }); if (ResourceAvail && shouldAddToPacket(MI)) { // Dependency check for MI with instructions in CurrentPacketMIs. for (auto *MJ : CurrentPacketMIs) { SUnit *SUJ = MIToSUnit[MJ]; assert(SUJ && "Missing SUnit Info!"); LLVM_DEBUG(dbgs() << " Checking against MJ " << *MJ); // Is it legal to packetize SUI and SUJ together. if (!isLegalToPacketizeTogether(SUI, SUJ)) { LLVM_DEBUG(dbgs() << " Not legal to add MI, try to prune\n"); // Allow packetization if dependency can be pruned. if (!isLegalToPruneDependencies(SUI, SUJ)) { // End the packet if dependency cannot be pruned. LLVM_DEBUG(dbgs() << " Could not prune dependencies for adding MI\n"); endPacket(MBB, MI); break; } LLVM_DEBUG(dbgs() << " Pruned dependence for adding MI\n"); } } } else { LLVM_DEBUG(if (ResourceAvail) dbgs() << "Resources are available, but instruction should not be " "added to packet\n " << MI); // End the packet if resource is not available, or if the instruction // should not be added to the current packet. endPacket(MBB, MI); } // Add MI to the current packet. LLVM_DEBUG(dbgs() << "* Adding MI to packet " << MI << '\n'); BeginItr = addToPacket(MI); } // For all instructions in the packetization range. // End any packet left behind. endPacket(MBB, EndItr); VLIWScheduler->exitRegion(); VLIWScheduler->finishBlock(); } bool VLIWPacketizerList::alias(const MachineMemOperand &Op1, const MachineMemOperand &Op2, bool UseTBAA) const { if (!Op1.getValue() || !Op2.getValue()) return true; int64_t MinOffset = std::min(Op1.getOffset(), Op2.getOffset()); int64_t Overlapa = Op1.getSize() + Op1.getOffset() - MinOffset; int64_t Overlapb = Op2.getSize() + Op2.getOffset() - MinOffset; AliasResult AAResult = AA->alias(MemoryLocation(Op1.getValue(), Overlapa, UseTBAA ? Op1.getAAInfo() : AAMDNodes()), MemoryLocation(Op2.getValue(), Overlapb, UseTBAA ? Op2.getAAInfo() : AAMDNodes())); return AAResult != AliasResult::NoAlias; } bool VLIWPacketizerList::alias(const MachineInstr &MI1, const MachineInstr &MI2, bool UseTBAA) const { if (MI1.memoperands_empty() || MI2.memoperands_empty()) return true; for (const MachineMemOperand *Op1 : MI1.memoperands()) for (const MachineMemOperand *Op2 : MI2.memoperands()) if (alias(*Op1, *Op2, UseTBAA)) return true; return false; } // Add a DAG mutation object to the ordered list. void VLIWPacketizerList::addMutation( std::unique_ptr Mutation) { VLIWScheduler->addMutation(std::move(Mutation)); }