1//==- MipsScheduleP5600.td - P5600 Scheduling Definitions --*- tablegen -*-===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10def MipsP5600Model : SchedMachineModel { // Machine-level parameters of the P5600 model.
11  int IssueWidth = 2; // 2x dispatched per cycle
12  int MicroOpBufferSize = 48; // min(48, 48, 64)
13  int LoadLatency = 4; // Same value as the Latency of P5600WriteLoad.
14  int MispredictPenalty = 8; // TODO: Estimated
15
16  let CompleteModel = 0; // The model is marked as incomplete.
17}
18
19let SchedModel = MipsP5600Model in {
20
21// ALQ Pipelines
22// =============
23
24def P5600ALQ : ProcResource<1> { let BufferSize = 16; } // ALQ: one unit, BufferSize 16.
25def P5600IssueALU : ProcResource<1> { let Super = P5600ALQ; } // ALU issue resource; its Super is the ALQ.
26
27// ALU Pipeline
28// ------------
29
30def P5600WriteALU : SchedWriteRes<[P5600IssueALU]>; // Consumes the ALU issue resource; no Latency override.
31
32// and, lui, nor, or, slti, sltiu, sub, subu, xor -- NOTE(review): sub/subu appear only as II_SUBU below; confirm.
33def : ItinRW<[P5600WriteALU],
34             [II_AND, II_LUI, II_NOR, II_OR, II_SLTI_SLTIU, II_SUBU, II_XOR]>;
35
36// AGQ Pipelines
37// =============
38
39def P5600AGQ : ProcResource<3> { let BufferSize = 16; } // AGQ: three units, BufferSize 16.
40def P5600IssueAL2 : ProcResource<1> { let Super = P5600AGQ; } // AL2 issue resource; its Super is the AGQ.
41def P5600IssueCTISTD : ProcResource<1> { let Super = P5600AGQ; } // CTISTD issue resource; its Super is the AGQ.
42def P5600IssueLDST : ProcResource<1> { let Super = P5600AGQ; } // LDST issue resource; its Super is the AGQ.
43
44def P5600AL2Div : ProcResource<1>; // Held for 34 cycles by P5600WriteAL2Div and P5600WriteAL2DivU.
45// Pseudo-resource used to block CTISTD when handling multi-pipeline splits.
46def P5600CTISTD : ProcResource<1>; // Listed by jump, store, lw[lr], mov[nz] and madd-class writes in this file.
47
48// CTISTD Pipeline
49// ---------------
50
51def P5600WriteJump : SchedWriteRes<[P5600IssueCTISTD, P5600CTISTD]>; // No Latency override.
52def P5600WriteJumpAndLink : SchedWriteRes<[P5600IssueCTISTD, P5600CTISTD]> {
53  let Latency = 2; // Same resources as P5600WriteJump, but with Latency 2.
54}
55
56// b, beq, beql, bg[et]z, bl[et]z, bne, bnel, j, syscall, jal, bltzal, jalx,
57// jalr, jr.hb, jr
58def : ItinRW<[P5600WriteJump], [II_B, II_BCC, II_BCCZ, II_BCCZAL, II_J, II_JR]>; // Branch and jump classes.
59def : ItinRW<[P5600WriteJumpAndLink], [II_JAL, II_JALR]>; // Jump-and-link classes.
60
61// LDST Pipeline
62// -------------
63
64def P5600WriteLoad : SchedWriteRes<[P5600IssueLDST]> {
65  let Latency = 4; // Same value as LoadLatency in MipsP5600Model.
66}
67
68def P5600WriteLoadShifted : SchedWriteRes<[P5600IssueLDST, P5600CTISTD]> { // Like P5600WriteLoad, plus the CTISTD pseudo-resource.
69  let Latency = 4;
70}
71
72def P5600WritePref : SchedWriteRes<[P5600IssueLDST]>; // No Latency override.
73
74def P5600WriteStore : SchedWriteRes<[P5600IssueLDST, P5600CTISTD]> {
75  // FIXME: This is a bit pessimistic. P5600CTISTD is only used during cycle 2
76  //        not during 0, 1, and 2.
77  let ResourceCycles = [ 1, 3 ]; // 1 cycle on P5600IssueLDST, 3 cycles on P5600CTISTD.
78}
79
80def P5600WriteGPRFromBypass : SchedWriteRes<[P5600IssueLDST]> { // Second step of P5600WriteMoveFPUToGPR.
81  let Latency = 2;
82}
83
84def P5600WriteStoreFromOtherUnits : SchedWriteRes<[P5600IssueLDST]>; // Second step of the P5600WriteStoreFPUS/FPUL sequences.
85def P5600WriteLoadToOtherUnits : SchedWriteRes<[P5600IssueLDST]> { // First step of P5600WriteLoadFPU.
86  let Latency = 0;
87}
88
89// l[bhw], l[bh]u, ll -- NOTE(review): II_LWU is listed below and no class for ll is visible here; confirm.
90def : ItinRW<[P5600WriteLoad], [II_LB, II_LBU, II_LH, II_LHU, II_LW, II_LWU]>;
91
92// lw[lr]
93def : ItinRW<[P5600WriteLoadShifted], [II_LWL, II_LWR]>;
94
95// s[bhw], sw[lr]
96def : ItinRW<[P5600WriteStore], [II_SB, II_SH, II_SW, II_SWL, II_SWR]>;
97
98// pref
99// (this instruction does not exist in the backend yet)
100def : ItinRW<[P5600WritePref], []>; // Empty class list for now.
101
102// sc
103// (this instruction does not exist in the backend yet)
104def : ItinRW<[P5600WriteStore], []>; // Empty class list for now.
105
106// LDST is also used in moves from general purpose registers to floating point
107// and MSA.
108def P5600WriteMoveGPRToOtherUnits : SchedWriteRes<[P5600IssueLDST]> { // First step of P5600WriteMoveGPRToFPU.
109  let Latency = 0;
110}
111
112// AL2 Pipeline
113// ------------
114
115def P5600WriteAL2 : SchedWriteRes<[P5600IssueAL2]>; // No Latency override.
116def P5600WriteAL2BitExt : SchedWriteRes<[P5600IssueAL2]> { let Latency = 2; }
117def P5600WriteAL2ShadowMov : SchedWriteRes<[P5600IssueAL2]> { let Latency = 2; }
118def P5600WriteAL2CondMov : SchedWriteRes<[P5600IssueAL2, P5600CTISTD]> { // Also lists the CTISTD pseudo-resource.
119  let Latency = 2;
120}
121def P5600WriteAL2Div : SchedWriteRes<[P5600IssueAL2, P5600AL2Div]> {
122  // Estimated worst case
123  let Latency = 34;
124  let ResourceCycles = [1, 34]; // 1 cycle on P5600IssueAL2, 34 cycles on P5600AL2Div.
125}
126def P5600WriteAL2DivU : SchedWriteRes<[P5600IssueAL2, P5600AL2Div]> { // Same figures as P5600WriteAL2Div.
127  // Estimated worst case
128  let Latency = 34;
129  let ResourceCycles = [1, 34];
130}
131def P5600WriteAL2Mul : SchedWriteRes<[P5600IssueAL2]> { let Latency = 3; }
132def P5600WriteAL2Mult: SchedWriteRes<[P5600IssueAL2]> { let Latency = 5; }
133def P5600WriteAL2MAdd: SchedWriteRes<[P5600IssueAL2, P5600CTISTD]> { // Also lists the CTISTD pseudo-resource.
134  let Latency = 5;
135}
136
137// clo, clz, di, mfhi, mflo
138def : ItinRW<[P5600WriteAL2], [II_CLO, II_CLZ, II_MFHI_MFLO]>;
139
140// ehb, rdhwr, rdpgpr, wrpgpr, wsbh -- NOTE(review): the "Unsupported Instructions" comment in this file lists rdhwr as never valid; confirm.
141def : ItinRW<[P5600WriteAL2ShadowMov], [II_RDHWR]>;
142
143// mov[nz]
144def : ItinRW<[P5600WriteAL2CondMov], [II_MOVN, II_MOVZ]>;
145
146// divu?
147def : ItinRW<[P5600WriteAL2Div], [II_DIV]>;
148def : ItinRW<[P5600WriteAL2DivU], [II_DIVU]>;
149
150// mul
151def : ItinRW<[P5600WriteAL2Mul], [II_MUL]>;
152// multu?
153def : ItinRW<[P5600WriteAL2Mult], [II_MULT, II_MULTU]>;
154// maddu?, msubu?, mthi, mtlo
155def : ItinRW<[P5600WriteAL2MAdd],
156             [II_MADD, II_MADDU, II_MSUB, II_MSUBU, II_MTHI_MTLO]>;
157
158// ext, ins
159def : ItinRW<[P5600WriteAL2BitExt],
160             [II_EXT, II_INS]>;
161
162// Either ALU or AL2 Pipelines
163// ---------------------------
164//
165// Some instructions can choose between ALU and AL2, but once dispatched to
166// ALQ or AGQ respectively they are committed to that path.
167// The decision is based on the outcome of the most recent selection when the
168// choice was last available. For now, we assume ALU is always chosen.
169
170def P5600WriteEitherALU : SchedWriteVariant<
171  // FIXME: Implement selection predicate
172  [SchedVar<SchedPredicate<[{1}]>, [P5600WriteALU]>, // Constant-true predicate: the ALU variant.
173   SchedVar<SchedPredicate<[{0}]>, [P5600WriteAL2]>  // Constant-false predicate: the AL2 variant.
174  ]>;
175
176// add, addi, addiu, addu, andi, ori, rotr, se[bh], sllv?, sr[al]v?, slt, sltu,
177// xori
178def : ItinRW<[P5600WriteEitherALU],
179             [II_ADDI, II_ADDIU, II_ANDI, II_ORI, II_ROTR, II_SEB, II_SEH,
180              II_SLT_SLTU, II_SLL, II_SRA, II_SRL, II_XORI, II_ADDU, II_SLLV,
181              II_SRAV, II_SRLV]>;
182
183// FPU Pipelines
184// =============
185
186def P5600FPQ : ProcResource<3> { let BufferSize = 16; } // FPQ: three units, BufferSize 16.
187def P5600IssueFPUS : ProcResource<1> { let Super = P5600FPQ; } // FPUS issue resource; its Super is the FPQ.
188def P5600IssueFPUL : ProcResource<1> { let Super = P5600FPQ; } // FPUL issue resource; its Super is the FPQ.
189def P5600IssueFPULoad : ProcResource<1> { let Super = P5600FPQ; } // FPU load issue resource; its Super is the FPQ.
190
191def P5600FPUDivSqrt : ProcResource<2>; // Two units; held by the div/rcp/rsqrt/sqrt writes.
192
193def P5600WriteFPUS : SchedWriteRes<[P5600IssueFPUS]>; // No Latency override.
194def P5600WriteFPUL : SchedWriteRes<[P5600IssueFPUL]> { let Latency = 4; }
195def P5600WriteFPUL_MADDSUB : SchedWriteRes<[P5600IssueFPUL]> { let Latency = 6; } // Used by the madd/msub/nmadd/nmsub classes.
196def P5600WriteFPUDivS : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
197  // Best/Common/Worst case = 7 / 23 / 27
198  let Latency = 23; // Using common case
199  let ResourceCycles = [ 1, 23 ]; // 1 cycle on P5600IssueFPUL, 23 cycles on P5600FPUDivSqrt.
200}
201def P5600WriteFPUDivD : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
202  // Best/Common/Worst case = 7 / 31 / 35
203  let Latency = 31; // Using common case
204  let ResourceCycles = [ 1, 31 ]; // Same layout as above: issue cycles, then P5600FPUDivSqrt cycles.
205}
206def P5600WriteFPURcpS : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
207  // Best/Common/Worst case = 7 / 19 / 23
208  let Latency = 19; // Using common case
209  let ResourceCycles = [ 1, 19 ];
210}
211def P5600WriteFPURcpD : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
212  // Best/Common/Worst case = 7 / 27 / 31
213  let Latency = 27; // Using common case
214  let ResourceCycles = [ 1, 27 ];
215}
216def P5600WriteFPURsqrtS : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
217  // Best/Common/Worst case = 7 / 27 / 27
218  let Latency = 27; // Using common case
219  let ResourceCycles = [ 1, 27 ];
220}
221def P5600WriteFPURsqrtD : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
222  // Best/Common/Worst case = 7 / 27 / 31
223  let Latency = 27; // Using common case
224  let ResourceCycles = [ 1, 27 ];
225}
226def P5600WriteFPUSqrtS : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
227  // Best/Common/Worst case = 7 / 27 / 31
228  let Latency = 27; // Using common case
229  let ResourceCycles = [ 1, 27 ];
230}
231def P5600WriteFPUSqrtD : SchedWriteRes<[P5600IssueFPUL, P5600FPUDivSqrt]> {
232  // Best/Common/Worst case = 7 / 35 / 39
233  let Latency = 35; // Using common case
234  let ResourceCycles = [ 1, 35 ];
235}
236def P5600WriteMSAShortLogic : SchedWriteRes<[P5600IssueFPUS]>; // No Latency override.
237def P5600WriteMSAShortInt : SchedWriteRes<[P5600IssueFPUS]> { let Latency = 2; }
238def P5600WriteMoveOtherUnitsToFPU : SchedWriteRes<[P5600IssueFPUS]>; // Second step of P5600WriteMoveGPRToFPU.
239
240// FPUS is also used in moves from floating point and MSA registers to general
241// purpose registers.
242def P5600WriteMoveFPUSToOtherUnits : SchedWriteRes<[P5600IssueFPUS]> { // First step of P5600WriteMoveFPUToGPR and P5600WriteStoreFPUS.
243  let Latency = 0;
244}
245
246// FPUL is also used in moves from floating point and MSA registers to general
247// purpose registers.
248def P5600WriteMoveFPULToOtherUnits : SchedWriteRes<[P5600IssueFPUL]>; // First step of P5600WriteStoreFPUL; no Latency override.
249
250// Short Pipe
251// ----------
252//
253// abs.[ds], abs.ps, bc1[tf]l?, mov[tf].[ds], mov[tf], mov.[ds], [cm][ft]c1,
254// m[ft]hc1, neg.[ds], neg.ps, nor.v, nori.b, or.v, ori.b, xor.v, xori.b,
255// sdxc1, sdc1, st.[bhwd], swc1, swxc1
256def : ItinRW<[P5600WriteFPUS], [II_ABS, II_MOVF_D, II_MOVF_S, II_MOVT_D,
257                                II_MOVT_S, II_MOV_D, II_MOV_S, II_NEG]>; // Only the abs/mov/neg classes are mapped by this record.
258
259// add_a.[bhwd], adds_[asu].[bhwd], addvi?.[bhwd], asub_[us].[bhwd],
260// aver?_[us].[bhwd] -- all mapped to P5600WriteMSAShortInt (Latency 2).
261def : InstRW<[P5600WriteMSAShortInt], (instregex "^ADD_A_[BHWD]$")>;
262def : InstRW<[P5600WriteMSAShortInt], (instregex "^ADDS_[ASU]_[BHWD]$")>;
263// TODO: ADDVI_[BHW] might be 1 cycle latency rather than 2. Need to confirm it.
264def : InstRW<[P5600WriteMSAShortInt], (instregex "^ADDVI?_[BHWD]$")>;
265def : InstRW<[P5600WriteMSAShortInt], (instregex "^ASUB_[US]_[BHWD]$")>; // Literal '_'; a bare '.' would match any character.
266def : InstRW<[P5600WriteMSAShortInt], (instregex "^AVER?_[US]_[BHWD]$")>; // Literal '_', as in the patterns above.
267
268// and.v, andi.b, or.v, ori.b, xor.v, xori.b, nor.v, nori.b, move.v, ldi.[bhwd]
269def : InstRW<[P5600WriteMSAShortLogic], (instregex "^MOVE_V$")>;
270def : InstRW<[P5600WriteMSAShortLogic], (instregex "^LDI_[BHWD]$")>;
271def : InstRW<[P5600WriteMSAShortLogic], (instregex "^(AND|OR|[XN]OR)_V$")>; // AND_V, OR_V, XOR_V, NOR_V.
272def : InstRW<[P5600WriteMSAShortLogic], (instregex "^(AND|OR|[XN]OR)I_B$")>; // ANDI_B, ORI_B, XORI_B, NORI_B.
273
274// Long Pipe
275// ----------
276//
277// add.[ds], add.ps, cvt.d.[sw], cvt.s.[dw], cvt.w.[sd], cvt.[sw].ps,
278// cvt.ps.[sw], c.<cc>.[ds], c.<cc>.ps, mul.[ds], mul.ps, sub.[ds], sub.ps,
279// trunc.w.[ds], trunc.w.ps
280def : ItinRW<[P5600WriteFPUL],
281             [II_ADD_D, II_ADD_S, II_CVT, II_C_CC_D, II_C_CC_S, II_MUL_D,
282              II_MUL_S, II_SUB_D, II_SUB_S, II_TRUNC]>; // P5600WriteFPUL has Latency 4.
283
284// div.[ds], div.ps
285def : ItinRW<[P5600WriteFPUDivS], [II_DIV_S]>; // Single precision: Latency 23.
286def : ItinRW<[P5600WriteFPUDivD], [II_DIV_D]>; // Double precision: Latency 31.
287
288// sqrt.[ds], sqrt.ps
289def : ItinRW<[P5600WriteFPUSqrtS], [II_SQRT_S]>; // Single precision: Latency 27.
290def : ItinRW<[P5600WriteFPUSqrtD], [II_SQRT_D]>; // Double precision: Latency 35.
291
292// madd.[ds], msub.[ds], nmadd.[ds], nmsub.[ds],
293// Operand 0 is read on cycle 5. All other operands are read on cycle 0. (NOTE(review): text previously said "on operand 0"; presumably a typo -- confirm.)
294def : ItinRW<[SchedReadAdvance<5>, P5600WriteFPUL_MADDSUB],
295             [II_MADD_D, II_MADD_S, II_MSUB_D, II_MSUB_S, II_NMADD_D,
296              II_NMADD_S, II_NMSUB_D, II_NMSUB_S]>; // P5600WriteFPUL_MADDSUB has Latency 6.
297
298// madd.ps, msub.ps, nmadd.ps, nmsub.ps
299// Operand 0 and 1 are read on cycle 5. All others are read on cycle 0.
300// (none of these instructions exist in the backend yet)
301
302// Load Pipe
303// ---------
304//
305// This is typically used in conjunction with the load pipeline under the AGQ.
306// All the instructions are in the 'Tricky Instructions' section.
307
308def P5600WriteLoadOtherUnitsToFPU : SchedWriteRes<[P5600IssueFPULoad]> { // Second step of P5600WriteLoadFPU.
309  let Latency = 4;
310}
311
312// Tricky Instructions
313// ===================
314//
315// These instructions are split across multiple uops (in different pipelines)
316// that must cooperate to complete the operation
317
318// FIXME: This isn't quite right since the implementation of WriteSequence
319//        currently aggregates the resources and ignores the exact cycle they
320//        are used.
321def P5600WriteMoveGPRToFPU : WriteSequence<[P5600WriteMoveGPRToOtherUnits, // LDST step (Latency 0), then
322                                            P5600WriteMoveOtherUnitsToFPU]>; // FPUS step (no Latency override).
323
324// FIXME: This isn't quite right since the implementation of WriteSequence
325//        currently aggregates the resources and ignores the exact cycle they
326//        are used.
327def P5600WriteMoveFPUToGPR : WriteSequence<[P5600WriteMoveFPUSToOtherUnits, // FPUS step (Latency 0), then
328                                            P5600WriteGPRFromBypass]>; // LDST step (Latency 2).
329
330// FIXME: This isn't quite right since the implementation of WriteSequence
331//        currently aggregates the resources and ignores the exact cycle they
332//        are used.
333def P5600WriteStoreFPUS : WriteSequence<[P5600WriteMoveFPUSToOtherUnits, // FPUS step (Latency 0), then
334                                         P5600WriteStoreFromOtherUnits]>; // LDST step (no Latency override).
335
336// FIXME: This isn't quite right since the implementation of WriteSequence
337//        currently aggregates the resources and ignores the exact cycle they
338//        are used.
339def P5600WriteStoreFPUL : WriteSequence<[P5600WriteMoveFPULToOtherUnits, // FPUL step (no Latency override), then
340                                         P5600WriteStoreFromOtherUnits]>; // LDST step (no Latency override).
341
342// FIXME: This isn't quite right since the implementation of WriteSequence
343//        currently aggregates the resources and ignores the exact cycle they
344//        are used.
345def P5600WriteLoadFPU : WriteSequence<[P5600WriteLoadToOtherUnits, // LDST step (Latency 0), then
346                                       P5600WriteLoadOtherUnitsToFPU]>; // FPU load step (Latency 4).
347
348// ctc1, mtc1, mthc1
349def : ItinRW<[P5600WriteMoveGPRToFPU], [II_CTC1, II_MTC1, II_MTHC1]>;
350
351// bc1[ft], cfc1, mfc1, mfhc1, movf, movt
352def : ItinRW<[P5600WriteMoveFPUToGPR],
353             [II_BC1F, II_BC1T, II_CFC1, II_MFC1, II_MFHC1, II_MOVF, II_MOVT]>;
354
355// swc1, swxc1, st.[bhwd]
356def : ItinRW<[P5600WriteStoreFPUS], [II_SWC1, II_SWXC1]>;
357def : InstRW<[P5600WriteStoreFPUS], (instregex "^ST_[BHWD]$")>; // MSA stores, matched by instruction name.
358
359// movn.[ds], movz.[ds] -- NOTE(review): these reuse the FPUL store sequence; confirm that is intended.
360def : ItinRW<[P5600WriteStoreFPUL], [II_MOVN_D, II_MOVN_S, II_MOVZ_D, II_MOVZ_S]>;
361
362// l[dw]x?c1, ld.[bhwd] -- FPU and MSA loads, all mapped to the P5600WriteLoadFPU sequence.
363def : ItinRW<[P5600WriteLoadFPU], [II_LDC1, II_LDXC1, II_LWC1, II_LWXC1]>;
364def : InstRW<[P5600WriteLoadFPU], (instregex "^LD_[BHWD]$")>; // Anchored at both ends, like the ST_[BHWD] pattern.
365
366// Unsupported Instructions
367// ========================
368//
369// The following instruction classes are never valid on P5600.
370//   II_DADDIU, II_DADDU, II_DMFC1, II_DMTC1, II_DMULT, II_DMULTU, II_DROTR,
371//   II_DROTR32, II_DROTRV, II_DDIV, II_DSLL, II_DSLL32, II_DSLLV, II_DSRA,
372//   II_DSRA32, II_DSRAV, II_DSRL, II_DSRL32, II_DSRLV, II_DSUBU, II_DDIVU,
373//   II_JALRC, II_LD, II_LD[LR], II_LUXC1, II_RESTORE, II_SAVE, II_SD, II_SDC1,
374//   II_SDL, II_SDR, II_SDXC1
375//
376// The following instructions are never valid on P5600.
377//   addq.ph, rdhwr, repl.ph, repl.qb, subq.ph, subu_s.qb
378//
379// Guesswork
380// =========
381//
382// This section is largely temporary guesswork.
383
384// ceil.[lw].[ds], floor.[lw].[ds], round.[lw].[ds]
385// Reason behind guess: trunc.[lw].[ds] and the various cvt's are in FPUL
386def : ItinRW<[P5600WriteFPUL], [II_CEIL, II_FLOOR, II_ROUND]>;
387
388// rotrv
389// Reason behind guess: rotr is in the same category and the two register forms
390//                      generally follow the immediate forms in this category
391def : ItinRW<[P5600WriteEitherALU], [II_ROTRV]>;
392}
393