blob: 3cff31ad4933588135cf9efd0a4a9d947d5016ed [file] [log] [blame]
Eugene Zelenko90d99202017-02-27 22:45:06 +00001//===- llvm/Target/TargetSchedule.cpp - Sched Machine Model ---------------===//
Andrew Trick99ab6c62012-09-14 20:26:46 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements a wrapper around MCSchedModel that allows the interface
11// to benefit from information currently only available in TargetInstrInfo.
12//
13//===----------------------------------------------------------------------===//
14
Chandler Carruthe3e43d92017-06-06 11:49:48 +000015#include "llvm/CodeGen/TargetSchedule.h"
Eugene Zelenko90d99202017-02-27 22:45:06 +000016#include "llvm/CodeGen/MachineFunction.h"
17#include "llvm/CodeGen/MachineInstr.h"
18#include "llvm/CodeGen/MachineOperand.h"
David Blaikie48319232017-11-08 01:01:31 +000019#include "llvm/CodeGen/TargetInstrInfo.h"
David Blaikiee3a9b4c2017-11-17 01:07:10 +000020#include "llvm/CodeGen/TargetRegisterInfo.h"
21#include "llvm/CodeGen/TargetSubtargetInfo.h"
Eugene Zelenko90d99202017-02-27 22:45:06 +000022#include "llvm/MC/MCInstrDesc.h"
23#include "llvm/MC/MCInstrItineraries.h"
24#include "llvm/MC/MCSchedule.h"
Chandler Carruthd04a8d42012-12-03 16:50:05 +000025#include "llvm/Support/CommandLine.h"
Eugene Zelenko90d99202017-02-27 22:45:06 +000026#include "llvm/Support/ErrorHandling.h"
Chandler Carruthd04a8d42012-12-03 16:50:05 +000027#include "llvm/Support/raw_ostream.h"
Eugene Zelenko90d99202017-02-27 22:45:06 +000028#include <algorithm>
29#include <cassert>
30#include <cstdint>
Andrew Trick99ab6c62012-09-14 20:26:46 +000031
32using namespace llvm;
33
Andrew Trick72fd0a92012-10-04 00:24:34 +000034static cl::opt<bool> EnableSchedModel("schedmodel", cl::Hidden, cl::init(true),
Andrew Trick99ab6c62012-09-14 20:26:46 +000035 cl::desc("Use TargetSchedModel for latency lookup"));
36
Andrew Trick34301ce2012-09-18 04:03:34 +000037static cl::opt<bool> EnableSchedItins("scheditins", cl::Hidden, cl::init(true),
38 cl::desc("Use InstrItineraryData for latency lookup"));
39
Andrew Trick42bb1062012-10-09 23:44:26 +000040bool TargetSchedModel::hasInstrSchedModel() const {
41 return EnableSchedModel && SchedModel.hasInstrSchedModel();
42}
43
44bool TargetSchedModel::hasInstrItineraries() const {
45 return EnableSchedItins && !InstrItins.isEmpty();
46}
47
Andrew Trick8d4abb22012-11-06 07:10:38 +000048static unsigned gcd(unsigned Dividend, unsigned Divisor) {
49 // Dividend and Divisor will be naturally swapped as needed.
Eugene Zelenko90d99202017-02-27 22:45:06 +000050 while (Divisor) {
Andrew Trick8d4abb22012-11-06 07:10:38 +000051 unsigned Rem = Dividend % Divisor;
52 Dividend = Divisor;
53 Divisor = Rem;
54 };
55 return Dividend;
56}
Eugene Zelenko90d99202017-02-27 22:45:06 +000057
Andrew Trick8d4abb22012-11-06 07:10:38 +000058static unsigned lcm(unsigned A, unsigned B) {
59 unsigned LCM = (uint64_t(A) * B) / gcd(A, B);
60 assert((LCM >= A && LCM >= B) && "LCM overflow");
61 return LCM;
62}
63
Sanjay Patele599cea2018-04-08 19:56:04 +000064void TargetSchedModel::init(const TargetSubtargetInfo *TSInfo) {
65 STI = TSInfo;
66 SchedModel = TSInfo->getSchedModel();
67 TII = TSInfo->getInstrInfo();
Andrew Trick99ab6c62012-09-14 20:26:46 +000068 STI->initInstrItins(InstrItins);
Andrew Trick8d4abb22012-11-06 07:10:38 +000069
70 unsigned NumRes = SchedModel.getNumProcResourceKinds();
71 ResourceFactors.resize(NumRes);
72 ResourceLCM = SchedModel.IssueWidth;
73 for (unsigned Idx = 0; Idx < NumRes; ++Idx) {
74 unsigned NumUnits = SchedModel.getProcResource(Idx)->NumUnits;
75 if (NumUnits > 0)
76 ResourceLCM = lcm(ResourceLCM, NumUnits);
77 }
78 MicroOpFactor = ResourceLCM / SchedModel.IssueWidth;
79 for (unsigned Idx = 0; Idx < NumRes; ++Idx) {
80 unsigned NumUnits = SchedModel.getProcResource(Idx)->NumUnits;
81 ResourceFactors[Idx] = NumUnits ? (ResourceLCM / NumUnits) : 0;
82 }
Andrew Trick99ab6c62012-09-14 20:26:46 +000083}
Andrew Trick34301ce2012-09-18 04:03:34 +000084
Javed Absar47652292017-03-27 20:46:37 +000085/// Returns true only if instruction is specified as single issue.
86bool TargetSchedModel::mustBeginGroup(const MachineInstr *MI,
87 const MCSchedClassDesc *SC) const {
88 if (hasInstrSchedModel()) {
89 if (!SC)
90 SC = resolveSchedClass(MI);
91 if (SC->isValid())
92 return SC->BeginGroup;
93 }
94 return false;
95}
96
97bool TargetSchedModel::mustEndGroup(const MachineInstr *MI,
98 const MCSchedClassDesc *SC) const {
99 if (hasInstrSchedModel()) {
100 if (!SC)
101 SC = resolveSchedClass(MI);
102 if (SC->isValid())
103 return SC->EndGroup;
104 }
105 return false;
106}
107
Andrew Trick8d4abb22012-11-06 07:10:38 +0000108unsigned TargetSchedModel::getNumMicroOps(const MachineInstr *MI,
109 const MCSchedClassDesc *SC) const {
Andrew Trick412cd2f2012-10-10 05:43:09 +0000110 if (hasInstrItineraries()) {
111 int UOps = InstrItins.getNumMicroOps(MI->getDesc().getSchedClass());
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000112 return (UOps >= 0) ? UOps : TII->getNumMicroOps(&InstrItins, *MI);
Andrew Trick412cd2f2012-10-10 05:43:09 +0000113 }
Andrew Trick4903c152012-10-11 05:37:06 +0000114 if (hasInstrSchedModel()) {
Andrew Trick8d4abb22012-11-06 07:10:38 +0000115 if (!SC)
116 SC = resolveSchedClass(MI);
117 if (SC->isValid())
118 return SC->NumMicroOps;
Andrew Trick4903c152012-10-11 05:37:06 +0000119 }
120 return MI->isTransient() ? 0 : 1;
Andrew Trick412cd2f2012-10-10 05:43:09 +0000121}
122
Andrew Trickfdd6fa82012-10-17 17:27:10 +0000123// The machine model may explicitly specify an invalid latency, which
124// effectively means infinite latency. Since users of the TargetSchedule API
125// don't know how to handle this, we convert it to a very large latency that is
126// easy to distinguish when debugging the DAG but won't induce overflow.
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000127static unsigned capLatency(int Cycles) {
Andrew Trickfdd6fa82012-10-17 17:27:10 +0000128 return Cycles >= 0 ? Cycles : 1000;
129}
130
Andrew Trick34301ce2012-09-18 04:03:34 +0000131/// Return the MCSchedClassDesc for this instruction. Some SchedClasses require
132/// evaluation of predicates that depend on instruction operands or flags.
133const MCSchedClassDesc *TargetSchedModel::
134resolveSchedClass(const MachineInstr *MI) const {
Andrew Trick34301ce2012-09-18 04:03:34 +0000135 // Get the definition's scheduling class descriptor from this machine model.
136 unsigned SchedClass = MI->getDesc().getSchedClass();
137 const MCSchedClassDesc *SCDesc = SchedModel.getSchedClassDesc(SchedClass);
Andrew Trick6a22dba2013-04-13 06:07:45 +0000138 if (!SCDesc->isValid())
139 return SCDesc;
Andrew Trick34301ce2012-09-18 04:03:34 +0000140
141#ifndef NDEBUG
142 unsigned NIter = 0;
143#endif
144 while (SCDesc->isVariant()) {
145 assert(++NIter < 6 && "Variants are nested deeper than the magic number");
146
147 SchedClass = STI->resolveSchedClass(SchedClass, MI, this);
148 SCDesc = SchedModel.getSchedClassDesc(SchedClass);
149 }
150 return SCDesc;
151}
152
153/// Find the def index of this operand. This index maps to the machine model and
154/// is independent of use operands. Def operands may be reordered with uses or
155/// merged with uses without affecting the def index (e.g. before/after
156/// regalloc). However, an instruction's def operands must never be reordered
157/// with respect to each other.
158static unsigned findDefIdx(const MachineInstr *MI, unsigned DefOperIdx) {
159 unsigned DefIdx = 0;
160 for (unsigned i = 0; i != DefOperIdx; ++i) {
161 const MachineOperand &MO = MI->getOperand(i);
162 if (MO.isReg() && MO.isDef())
163 ++DefIdx;
164 }
165 return DefIdx;
166}
167
168/// Find the use index of this operand. This is independent of the instruction's
169/// def operands.
Andrew Trick3918cad2012-09-18 18:20:02 +0000170///
171/// Note that uses are not determined by the operand's isUse property, which
172/// is simply the inverse of isDef. Here we consider any readsReg operand to be
173/// a "use". The machine model allows an operand to be both a Def and Use.
Andrew Trick34301ce2012-09-18 04:03:34 +0000174static unsigned findUseIdx(const MachineInstr *MI, unsigned UseOperIdx) {
175 unsigned UseIdx = 0;
176 for (unsigned i = 0; i != UseOperIdx; ++i) {
177 const MachineOperand &MO = MI->getOperand(i);
Matthias Braunfb335522016-08-24 02:32:29 +0000178 if (MO.isReg() && MO.readsReg() && !MO.isDef())
Andrew Trick34301ce2012-09-18 04:03:34 +0000179 ++UseIdx;
180 }
181 return UseIdx;
182}
183
184// Top-level API for clients that know the operand indices.
185unsigned TargetSchedModel::computeOperandLatency(
186 const MachineInstr *DefMI, unsigned DefOperIdx,
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000187 const MachineInstr *UseMI, unsigned UseOperIdx) const {
Andrew Trick34301ce2012-09-18 04:03:34 +0000188
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000189 if (!hasInstrSchedModel() && !hasInstrItineraries())
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000190 return TII->defaultDefLatency(SchedModel, *DefMI);
Andrew Trick34301ce2012-09-18 04:03:34 +0000191
Andrew Trick42bb1062012-10-09 23:44:26 +0000192 if (hasInstrItineraries()) {
Andrew Trick72fd0a92012-10-04 00:24:34 +0000193 int OperLatency = 0;
194 if (UseMI) {
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000195 OperLatency = TII->getOperandLatency(&InstrItins, *DefMI, DefOperIdx,
196 *UseMI, UseOperIdx);
Andrew Trick34301ce2012-09-18 04:03:34 +0000197 }
Andrew Trick72fd0a92012-10-04 00:24:34 +0000198 else {
199 unsigned DefClass = DefMI->getDesc().getSchedClass();
200 OperLatency = InstrItins.getOperandCycle(DefClass, DefOperIdx);
201 }
202 if (OperLatency >= 0)
203 return OperLatency;
204
205 // No operand latency was found.
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000206 unsigned InstrLatency = TII->getInstrLatency(&InstrItins, *DefMI);
Andrew Trick72fd0a92012-10-04 00:24:34 +0000207
208 // Expected latency is the max of the stage latency and itinerary props.
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000209 // Rather than directly querying InstrItins stage latency, we call a TII
210 // hook to allow subtargets to specialize latency. This hook is only
211 // applicable to the InstrItins model. InstrSchedModel should model all
212 // special cases without TII hooks.
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000213 InstrLatency =
214 std::max(InstrLatency, TII->defaultDefLatency(SchedModel, *DefMI));
Andrew Trick72fd0a92012-10-04 00:24:34 +0000215 return InstrLatency;
216 }
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000217 // hasInstrSchedModel()
Andrew Trick72fd0a92012-10-04 00:24:34 +0000218 const MCSchedClassDesc *SCDesc = resolveSchedClass(DefMI);
219 unsigned DefIdx = findDefIdx(DefMI, DefOperIdx);
220 if (DefIdx < SCDesc->NumWriteLatencyEntries) {
221 // Lookup the definition's write latency in SubtargetInfo.
222 const MCWriteLatencyEntry *WLEntry =
223 STI->getWriteLatencyEntry(SCDesc, DefIdx);
224 unsigned WriteID = WLEntry->WriteResourceID;
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000225 unsigned Latency = capLatency(WLEntry->Cycles);
Andrew Trick72fd0a92012-10-04 00:24:34 +0000226 if (!UseMI)
227 return Latency;
228
229 // Lookup the use's latency adjustment in SubtargetInfo.
230 const MCSchedClassDesc *UseDesc = resolveSchedClass(UseMI);
231 if (UseDesc->NumReadAdvanceEntries == 0)
232 return Latency;
233 unsigned UseIdx = findUseIdx(UseMI, UseOperIdx);
Andrew Trick71b9d942013-06-17 21:45:18 +0000234 int Advance = STI->getReadAdvanceCycles(UseDesc, UseIdx, WriteID);
235 if (Advance > 0 && (unsigned)Advance > Latency) // unsigned wrap
236 return 0;
237 return Latency - Advance;
Andrew Trick72fd0a92012-10-04 00:24:34 +0000238 }
239 // If DefIdx does not exist in the model (e.g. implicit defs), then return
240 // unit latency (defaultDefLatency may be too conservative).
Andrew Trick3918cad2012-09-18 18:20:02 +0000241#ifndef NDEBUG
Andrew Trick72fd0a92012-10-04 00:24:34 +0000242 if (SCDesc->isValid() && !DefMI->getOperand(DefOperIdx).isImplicit()
Andrew Trick07015642013-09-25 18:14:12 +0000243 && !DefMI->getDesc().OpInfo[DefOperIdx].isOptionalDef()
244 && SchedModel.isComplete()) {
Matthias Braun63f73d72015-07-17 17:50:11 +0000245 errs() << "DefIdx " << DefIdx << " exceeds machine model writes for "
MinSeong Kim9ec37632016-01-05 14:50:15 +0000246 << *DefMI << " (Try with MCSchedModel.CompleteModel set to false)";
Matthias Braun63f73d72015-07-17 17:50:11 +0000247 llvm_unreachable("incomplete machine model");
Andrew Trick72fd0a92012-10-04 00:24:34 +0000248 }
Andrew Trick3918cad2012-09-18 18:20:02 +0000249#endif
Andrew Trick51f67472013-03-16 18:58:57 +0000250 // FIXME: Automatically giving all implicit defs defaultDefLatency is
251 // undesirable. We should only do it for defs that are known to the MC
252 // desc like flags. Truly implicit defs should get 1 cycle latency.
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000253 return DefMI->isTransient() ? 0 : TII->defaultDefLatency(SchedModel, *DefMI);
Andrew Trick34301ce2012-09-18 04:03:34 +0000254}
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000255
Matthias Braunbe4ab8d2015-05-14 18:01:13 +0000256unsigned
257TargetSchedModel::computeInstrLatency(const MCSchedClassDesc &SCDesc) const {
Andrea Di Biagiofe3b1d22018-03-13 15:22:13 +0000258 return capLatency(MCSchedModel::computeInstrLatency(*STI, SCDesc));
Matthias Braunbe4ab8d2015-05-14 18:01:13 +0000259}
260
Gerolf Hoflehnerb0b70882014-08-03 21:35:39 +0000261unsigned TargetSchedModel::computeInstrLatency(unsigned Opcode) const {
262 assert(hasInstrSchedModel() && "Only call this function with a SchedModel");
Gerolf Hoflehnerb0b70882014-08-03 21:35:39 +0000263 unsigned SCIdx = TII->get(Opcode).getSchedClass();
Andrea Di Biagioae5fb652018-05-31 13:30:42 +0000264 return capLatency(SchedModel.computeInstrLatency(*STI, SCIdx));
265}
266
267unsigned TargetSchedModel::computeInstrLatency(const MCInst &Inst) const {
268 if (hasInstrSchedModel())
269 return capLatency(SchedModel.computeInstrLatency(*STI, *TII, Inst));
270 return computeInstrLatency(Inst.getOpcode());
Gerolf Hoflehnerb0b70882014-08-03 21:35:39 +0000271}
272
Arnold Schwaighoferd42730d2013-09-30 15:28:56 +0000273unsigned
274TargetSchedModel::computeInstrLatency(const MachineInstr *MI,
275 bool UseDefaultDefLatency) const {
Andrew Trick82d46ae2012-10-10 05:43:18 +0000276 // For the itinerary model, fall back to the old subtarget hook.
277 // Allow subtargets to compute Bundle latencies outside the machine model.
Arnold Schwaighoferd42730d2013-09-30 15:28:56 +0000278 if (hasInstrItineraries() || MI->isBundle() ||
279 (!hasInstrSchedModel() && !UseDefaultDefLatency))
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000280 return TII->getInstrLatency(&InstrItins, *MI);
Andrew Trick82d46ae2012-10-10 05:43:18 +0000281
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000282 if (hasInstrSchedModel()) {
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000283 const MCSchedClassDesc *SCDesc = resolveSchedClass(MI);
Matthias Braunbe4ab8d2015-05-14 18:01:13 +0000284 if (SCDesc->isValid())
285 return computeInstrLatency(*SCDesc);
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000286 }
Duncan P. N. Exon Smith567409d2016-06-30 00:01:54 +0000287 return TII->defaultDefLatency(SchedModel, *MI);
Andrew Trickc0dfffa2012-10-09 23:44:32 +0000288}
Andrew Trick412cd2f2012-10-10 05:43:09 +0000289
290unsigned TargetSchedModel::
291computeOutputLatency(const MachineInstr *DefMI, unsigned DefOperIdx,
292 const MachineInstr *DepMI) const {
Junmo Park9200ab32016-06-21 08:09:58 +0000293 if (!SchedModel.isOutOfOrder())
Andrew Trick412cd2f2012-10-10 05:43:09 +0000294 return 1;
295
Junmo Park9200ab32016-06-21 08:09:58 +0000296 // Out-of-order processor can dispatch WAW dependencies in the same cycle.
Andrew Trick412cd2f2012-10-10 05:43:09 +0000297
298 // Treat predication as a data dependency for out-of-order cpus. In-order
299 // cpus do not need to treat predicated writes specially.
300 //
301 // TODO: The following hack exists because predication passes do not
302 // correctly append imp-use operands, and readsReg() strangely returns false
303 // for predicated defs.
304 unsigned Reg = DefMI->getOperand(DefOperIdx).getReg();
Justin Bogner1842f4a2017-10-10 23:50:49 +0000305 const MachineFunction &MF = *DefMI->getMF();
Eric Christopher60355182014-08-05 02:39:49 +0000306 const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
Duncan P. N. Exon Smith5b9b80e2016-02-23 02:46:52 +0000307 if (!DepMI->readsRegister(Reg, TRI) && TII->isPredicated(*DepMI))
Andrew Trick412cd2f2012-10-10 05:43:09 +0000308 return computeInstrLatency(DefMI);
309
310 // If we have a per operand scheduling model, check if this def is writing
311 // an unbuffered resource. If so, it treated like an in-order cpu.
312 if (hasInstrSchedModel()) {
313 const MCSchedClassDesc *SCDesc = resolveSchedClass(DefMI);
Andrew Trick4903c152012-10-11 05:37:06 +0000314 if (SCDesc->isValid()) {
315 for (const MCWriteProcResEntry *PRI = STI->getWriteProcResBegin(SCDesc),
316 *PRE = STI->getWriteProcResEnd(SCDesc); PRI != PRE; ++PRI) {
Andrew Trickb86a0cd2013-06-15 04:49:57 +0000317 if (!SchedModel.getProcResource(PRI->ProcResourceIdx)->BufferSize)
Andrew Trick4903c152012-10-11 05:37:06 +0000318 return 1;
319 }
Andrew Trick412cd2f2012-10-10 05:43:09 +0000320 }
321 }
322 return 0;
323}
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000324
Sanjay Patel863443f2018-06-05 23:34:45 +0000325double
Andrea Di Biagiob5e23d12018-04-15 17:32:17 +0000326TargetSchedModel::computeReciprocalThroughput(const MachineInstr *MI) const {
327 if (hasInstrItineraries()) {
328 unsigned SchedClass = MI->getDesc().getSchedClass();
329 return MCSchedModel::getReciprocalThroughput(SchedClass,
330 *getInstrItineraries());
331 }
332
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000333 if (hasInstrSchedModel())
Andrea Di Biagio0718ccc2018-03-13 16:28:55 +0000334 return MCSchedModel::getReciprocalThroughput(*STI, *resolveSchedClass(MI));
Sanjay Patel863443f2018-06-05 23:34:45 +0000335
336 return 0.0;
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000337}
338
Sanjay Patel863443f2018-06-05 23:34:45 +0000339double
Andrea Di Biagiob5e23d12018-04-15 17:32:17 +0000340TargetSchedModel::computeReciprocalThroughput(unsigned Opcode) const {
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000341 unsigned SchedClass = TII->get(Opcode).getSchedClass();
342 if (hasInstrItineraries())
Andrea Di Biagiob5e23d12018-04-15 17:32:17 +0000343 return MCSchedModel::getReciprocalThroughput(SchedClass,
344 *getInstrItineraries());
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000345 if (hasInstrSchedModel()) {
Andrea Di Biagio0718ccc2018-03-13 16:28:55 +0000346 const MCSchedClassDesc &SCDesc = *SchedModel.getSchedClassDesc(SchedClass);
347 if (SCDesc.isValid() && !SCDesc.isVariant())
348 return MCSchedModel::getReciprocalThroughput(*STI, SCDesc);
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000349 }
Sanjay Patel863443f2018-06-05 23:34:45 +0000350
351 return 0.0;
Andrew V. Tischenko37965612017-04-14 07:44:23 +0000352}
Andrea Di Biagioae5fb652018-05-31 13:30:42 +0000353
Sanjay Patel863443f2018-06-05 23:34:45 +0000354double
Andrea Di Biagioae5fb652018-05-31 13:30:42 +0000355TargetSchedModel::computeReciprocalThroughput(const MCInst &MI) const {
356 if (hasInstrSchedModel())
357 return SchedModel.getReciprocalThroughput(*STI, *TII, MI);
358 return computeReciprocalThroughput(MI.getOpcode());
359}
360