1 //===-- PPCScheduleE500mc.td - e500mc Scheduling Defs ------*- tablegen -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines the itinerary class data for the Freescale e500mc 32-bit
13 // All information is derived from the "e500mc Core Reference Manual",
14 // Freescale Document Number E500MCRM, Rev. 1, 03/2012.
16 //===----------------------------------------------------------------------===//
17 // Relevant functional units in the Freescale e500mc core:
19 // * Decode & Dispatch
20 // Can dispatch up to 2 instructions per clock cycle to either the GPR Issue
21 // queues (GIQx), FP Issue Queue (FIQ), or Branch issue queue (BIQ).
22 def E500_DIS0 : FuncUnit; // Dispatch stage - insn 1
23 def E500_DIS1 : FuncUnit; // Dispatch stage - insn 2
26 // 6 pipelined execution units: SFX0, SFX1, BU, FPU, LSU, CFX.
27 // Some instructions can only execute in SFX0 but not SFX1.
28 // The CFX has a bypass path, allowing non-divide instructions to execute
29 // while a divide instruction is executed.
30 def E500_SFX0 : FuncUnit; // Simple unit 0
31 def E500_SFX1 : FuncUnit; // Simple unit 1
32 def E500_BU : FuncUnit; // Branch unit
33 def E500_CFX_DivBypass
34 : FuncUnit; // CFX divide bypass path
35 def E500_CFX_0 : FuncUnit; // CFX pipeline
36 def E500_LSU_0 : FuncUnit; // LSU pipeline
37 def E500_FPU_0 : FuncUnit; // FPU pipeline
39 def E500_GPR_Bypass : Bypass;
40 def E500_FPR_Bypass : Bypass;
41 def E500_CR_Bypass : Bypass;
43 def PPCE500mcItineraries : ProcessorItineraries<
44 [E500_DIS0, E500_DIS1, E500_SFX0, E500_SFX1, E500_BU, E500_CFX_DivBypass,
45 E500_CFX_0, E500_LSU_0, E500_FPU_0],
46 [E500_CR_Bypass, E500_GPR_Bypass, E500_FPR_Bypass], [
47 InstrItinData<IIC_IntSimple, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
48 InstrStage<1, [E500_SFX0, E500_SFX1]>],
49 [4, 1, 1], // Latency = 1
51 E500_GPR_Bypass, E500_GPR_Bypass]>,
52 InstrItinData<IIC_IntGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
53 InstrStage<1, [E500_SFX0, E500_SFX1]>],
54 [4, 1, 1], // Latency = 1
56 E500_GPR_Bypass, E500_GPR_Bypass]>,
57 InstrItinData<IIC_IntCompare, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
58 InstrStage<1, [E500_SFX0, E500_SFX1]>],
59 [5, 1, 1], // Latency = 1 or 2
61 E500_GPR_Bypass, E500_GPR_Bypass]>,
62 InstrItinData<IIC_IntDivW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
63 InstrStage<1, [E500_CFX_0], 0>,
64 InstrStage<14, [E500_CFX_DivBypass]>],
65 [17, 1, 1], // Latency=4..35, Repeat= 4..35
67 E500_GPR_Bypass, E500_GPR_Bypass]>,
68 InstrItinData<IIC_IntMFFS, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
69 InstrStage<8, [E500_FPU_0]>],
72 InstrItinData<IIC_IntMTFSB0, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
73 InstrStage<8, [E500_FPU_0]>],
74 [11, 1, 1], // Latency = 8
75 [NoBypass, NoBypass, NoBypass]>,
76 InstrItinData<IIC_IntMulHW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
77 InstrStage<1, [E500_CFX_0]>],
78 [7, 1, 1], // Latency = 4, Repeat rate = 1
80 E500_GPR_Bypass, E500_GPR_Bypass]>,
81 InstrItinData<IIC_IntMulHWU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
82 InstrStage<1, [E500_CFX_0]>],
83 [7, 1, 1], // Latency = 4, Repeat rate = 1
85 E500_GPR_Bypass, E500_GPR_Bypass]>,
86 InstrItinData<IIC_IntMulLI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
87 InstrStage<1, [E500_CFX_0]>],
88 [7, 1, 1], // Latency = 4, Repeat rate = 1
90 E500_GPR_Bypass, E500_GPR_Bypass]>,
91 InstrItinData<IIC_IntRotate, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
92 InstrStage<1, [E500_SFX0, E500_SFX1]>],
93 [4, 1, 1], // Latency = 1
95 E500_GPR_Bypass, E500_GPR_Bypass]>,
96 InstrItinData<IIC_IntShift, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
97 InstrStage<1, [E500_SFX0, E500_SFX1]>],
98 [4, 1, 1], // Latency = 1
100 E500_GPR_Bypass, E500_GPR_Bypass]>,
101 InstrItinData<IIC_IntTrapW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
102 InstrStage<2, [E500_SFX0]>],
103 [5, 1], // Latency = 2, Repeat rate = 2
104 [E500_GPR_Bypass, E500_GPR_Bypass]>,
105 InstrItinData<IIC_BrB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
106 InstrStage<1, [E500_BU]>],
107 [4, 1], // Latency = 1
108 [NoBypass, E500_GPR_Bypass]>,
109 InstrItinData<IIC_BrCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
110 InstrStage<1, [E500_BU]>],
111 [4, 1, 1], // Latency = 1
113 E500_CR_Bypass, E500_CR_Bypass]>,
114 InstrItinData<IIC_BrMCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
115 InstrStage<1, [E500_BU]>],
116 [4, 1], // Latency = 1
117 [E500_CR_Bypass, E500_CR_Bypass]>,
118 InstrItinData<IIC_BrMCRX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
119 InstrStage<1, [E500_SFX0, E500_SFX1]>],
120 [4, 1, 1], // Latency = 1
121 [E500_CR_Bypass, E500_GPR_Bypass]>,
122 InstrItinData<IIC_LdStDCBA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
123 InstrStage<1, [E500_LSU_0]>],
124 [6, 1], // Latency = 3, Repeat rate = 1
125 [E500_GPR_Bypass, E500_GPR_Bypass]>,
126 InstrItinData<IIC_LdStDCBF, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
127 InstrStage<1, [E500_LSU_0]>],
128 [6, 1], // Latency = 3
129 [E500_GPR_Bypass, E500_GPR_Bypass]>,
130 InstrItinData<IIC_LdStDCBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
131 InstrStage<1, [E500_LSU_0]>],
132 [6, 1], // Latency = 3
133 [E500_GPR_Bypass, E500_GPR_Bypass]>,
134 InstrItinData<IIC_LdStLoad, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
135 InstrStage<1, [E500_LSU_0]>],
136 [6, 1], // Latency = 3
137 [E500_GPR_Bypass, E500_GPR_Bypass]>,
138 InstrItinData<IIC_LdStLoadUpd, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
139 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
140 InstrStage<1, [E500_LSU_0]>],
141 [6, 1], // Latency = 3
142 [E500_GPR_Bypass, E500_GPR_Bypass],
144 InstrItinData<IIC_LdStStore, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
145 InstrStage<1, [E500_LSU_0]>],
146 [6, 1], // Latency = 3
147 [NoBypass, E500_GPR_Bypass]>,
148 InstrItinData<IIC_LdStStoreUpd,[InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
149 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
150 InstrStage<1, [E500_LSU_0]>],
151 [6, 1], // Latency = 3
152 [NoBypass, E500_GPR_Bypass],
154 InstrItinData<IIC_LdStICBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
155 InstrStage<1, [E500_LSU_0]>],
156 [6, 1], // Latency = 3
157 [NoBypass, E500_GPR_Bypass]>,
158 InstrItinData<IIC_LdStSTFD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
159 InstrStage<1, [E500_LSU_0]>],
160 [6, 1, 1], // Latency = 3
162 E500_GPR_Bypass, E500_GPR_Bypass]>,
163 InstrItinData<IIC_LdStSTFDU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
164 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
165 InstrStage<1, [E500_LSU_0]>],
166 [6, 1, 1], // Latency = 3
168 E500_GPR_Bypass, E500_GPR_Bypass],
170 InstrItinData<IIC_LdStLFD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
171 InstrStage<1, [E500_LSU_0]>],
172 [7, 1, 1], // Latency = 4
174 E500_GPR_Bypass, E500_GPR_Bypass]>,
175 InstrItinData<IIC_LdStLFDU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
176 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
177 InstrStage<1, [E500_LSU_0]>],
178 [7, 1, 1], // Latency = 4
180 E500_GPR_Bypass, E500_GPR_Bypass],
182 InstrItinData<IIC_LdStLHA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
183 InstrStage<1, [E500_LSU_0]>],
184 [6, 1], // Latency = 3
185 [E500_GPR_Bypass, E500_GPR_Bypass]>,
186 InstrItinData<IIC_LdStLHAU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
187 InstrStage<1, [E500_SFX0, E500_SFX1], 0>,
188 InstrStage<1, [E500_LSU_0]>],
189 [6, 1], // Latency = 3
190 [E500_GPR_Bypass, E500_GPR_Bypass]>,
191 InstrItinData<IIC_LdStLMW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
192 InstrStage<1, [E500_LSU_0]>],
193 [7, 1], // Latency = r+3
194 [NoBypass, E500_GPR_Bypass]>,
195 InstrItinData<IIC_LdStLWARX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
196 InstrStage<3, [E500_LSU_0]>],
197 [6, 1, 1], // Latency = 3, Repeat rate = 3
199 E500_GPR_Bypass, E500_GPR_Bypass]>,
200 InstrItinData<IIC_LdStSTWCX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
201 InstrStage<1, [E500_LSU_0]>],
202 [6, 1], // Latency = 3
203 [NoBypass, E500_GPR_Bypass]>,
204 InstrItinData<IIC_LdStSync, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
205 InstrStage<1, [E500_LSU_0]>]>,
206 InstrItinData<IIC_SprMFSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
207 InstrStage<4, [E500_SFX0]>],
209 [E500_GPR_Bypass, E500_GPR_Bypass]>,
210 InstrItinData<IIC_SprMTMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
211 InstrStage<2, [E500_SFX0, E500_SFX1]>],
212 [5, 1], // Latency = 2, Repeat rate = 4
213 [E500_GPR_Bypass, E500_GPR_Bypass]>,
214 InstrItinData<IIC_SprMTSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
215 InstrStage<1, [E500_SFX0]>],
217 [NoBypass, E500_GPR_Bypass]>,
218 InstrItinData<IIC_SprTLBSYNC, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
219 InstrStage<1, [E500_LSU_0], 0>]>,
220 InstrItinData<IIC_SprMFCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
221 InstrStage<5, [E500_SFX0]>],
223 [E500_GPR_Bypass, E500_CR_Bypass]>,
224 InstrItinData<IIC_SprMFMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
225 InstrStage<4, [E500_SFX0]>],
226 [7, 1], // Latency = 4, Repeat rate = 4
227 [E500_GPR_Bypass, E500_GPR_Bypass]>,
228 InstrItinData<IIC_SprMFSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
229 InstrStage<1, [E500_SFX0, E500_SFX1]>],
230 [4, 1], // Latency = 1, Repeat rate = 1
231 [E500_GPR_Bypass, E500_CR_Bypass]>,
232 InstrItinData<IIC_SprMFTB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
233 InstrStage<4, [E500_SFX0]>],
234 [7, 1], // Latency = 4, Repeat rate = 4
235 [NoBypass, E500_GPR_Bypass]>,
236 InstrItinData<IIC_SprMTSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
237 InstrStage<1, [E500_SFX0, E500_SFX1]>],
238 [4, 1], // Latency = 1, Repeat rate = 1
239 [E500_CR_Bypass, E500_GPR_Bypass]>,
240 InstrItinData<IIC_SprMTSRIN, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
241 InstrStage<1, [E500_SFX0]>],
243 [NoBypass, E500_GPR_Bypass]>,
244 InstrItinData<IIC_FPGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
245 InstrStage<2, [E500_FPU_0]>],
246 [11, 1, 1], // Latency = 8, Repeat rate = 2
248 E500_FPR_Bypass, E500_FPR_Bypass]>,
249 InstrItinData<IIC_FPAddSub, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
250 InstrStage<4, [E500_FPU_0]>],
251 [13, 1, 1], // Latency = 10, Repeat rate = 4
253 E500_FPR_Bypass, E500_FPR_Bypass]>,
254 InstrItinData<IIC_FPCompare, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
255 InstrStage<2, [E500_FPU_0]>],
256 [11, 1, 1], // Latency = 8, Repeat rate = 2
258 E500_FPR_Bypass, E500_FPR_Bypass]>,
259 InstrItinData<IIC_FPDivD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
260 InstrStage<68, [E500_FPU_0]>],
261 [71, 1, 1], // Latency = 68, Repeat rate = 68
263 E500_FPR_Bypass, E500_FPR_Bypass]>,
264 InstrItinData<IIC_FPDivS, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
265 InstrStage<38, [E500_FPU_0]>],
266 [41, 1, 1], // Latency = 38, Repeat rate = 38
268 E500_FPR_Bypass, E500_FPR_Bypass]>,
269 InstrItinData<IIC_FPFused, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
270 InstrStage<4, [E500_FPU_0]>],
271 [13, 1, 1, 1], // Latency = 10, Repeat rate = 4
273 E500_FPR_Bypass, E500_FPR_Bypass,
275 InstrItinData<IIC_FPRes, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
276 InstrStage<38, [E500_FPU_0]>],
277 [41, 1], // Latency = 38, Repeat rate = 38
278 [E500_FPR_Bypass, E500_FPR_Bypass]>
281 // ===---------------------------------------------------------------------===//
282 // e500mc machine model for scheduling and other instruction cost heuristics.
284 def PPCE500mcModel : SchedMachineModel {
285 let IssueWidth = 2; // 2 micro-ops are dispatched per cycle.
286 let MinLatency = -1; // OperandCycles are interpreted as MinLatency.
287 let LoadLatency = 5; // Optimistic load latency assuming bypass.
288 // This is overriden by OperandCycles if the
289 // Itineraries are queried instead.
291 let Itineraries = PPCE500mcItineraries;