1 //===-- PPCScheduleE500.td - e500 Scheduling Defs ------*- tablegen -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines the itinerary class data for the Freescale e500 32-bit
// Power Architecture core.
13 // All information is derived from the "e500 Core Reference Manual",
14 // Freescale Document Number E500MCRM, Rev. 1, 03/2012.
16 //===----------------------------------------------------------------------===//
17 // Relevant functional units in the Freescale e500 core:
19 // * Decode & Dispatch
20 // Can dispatch up to 2 instructions per clock cycle to either the GPR Issue
21 // queues (GIQx) or Branch issue queue (BIQ).
// Dispatch functional units. Each itinerary entry below opens with a stage
// that reserves either E500_DIS0 or E500_DIS1 for one cycle.
22 def E500_DIS0 : FuncUnit; // Dispatch stage - insn 1 (first of up to two per cycle)
23 def E500_DIS1 : FuncUnit; // Dispatch stage - insn 2 (second of up to two per cycle)
26 // 5 pipelined execution units: SU0, SU1, BU, LSU, MU.
27 // Some instructions can only execute in SU0 but not SU1.
// Execution-pipeline functional units, reserved by the stages that follow the
// dispatch stage in each itinerary entry.
28 def E500_SU0 : FuncUnit; // Simple unit 0 (sole unit for some entries, e.g. IIC_IntTrapW)
29 def E500_SU1 : FuncUnit; // Simple unit 1 (listed alongside SU0 in the entries below)
30 def E500_BU : FuncUnit; // Branch unit (IIC_BrB, IIC_BrCR, IIC_BrMCR)
31 def E500_MU : FuncUnit; // MU pipeline (divide, multiply, FP and IIC_VecComplex entries)
32 def E500_LSU_0 : FuncUnit; // LSU pipeline (IIC_LdSt* entries and IIC_SprTLBSYNC)
// Pipeline bypass (result-forwarding) resources. They are named in the bypass
// list of PPCE500Itineraries and in the per-operand bypass lists of its entries.
34 def E500_GPR_Bypass : Bypass;
35 def E500_CR_Bypass : Bypass;
// NOTE(review): E500_DivBypass is registered with the itinerary, but no entry
// appears to reference it - confirm whether it is still needed.
36 def E500_DivBypass : Bypass;
38 def PPCE500Itineraries : ProcessorItineraries<
39 [E500_DIS0, E500_DIS1, E500_SU0, E500_SU1, E500_BU,
41 [E500_CR_Bypass, E500_GPR_Bypass, E500_DivBypass], [
42 InstrItinData<IIC_IntSimple, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
43 InstrStage<1, [E500_SU0, E500_SU1]>],
44 [4, 1, 1], // Latency = 1
46 E500_GPR_Bypass, E500_GPR_Bypass]>,
47 InstrItinData<IIC_IntGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
48 InstrStage<1, [E500_SU0, E500_SU1]>],
49 [4, 1, 1], // Latency = 1
51 E500_GPR_Bypass, E500_GPR_Bypass]>,
52 InstrItinData<IIC_IntISEL, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
53 InstrStage<1, [E500_SU0, E500_SU1]>],
54 [4, 1, 1, 1], // Latency = 1
56 E500_GPR_Bypass, E500_GPR_Bypass,
58 InstrItinData<IIC_IntCompare, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
59 InstrStage<1, [E500_SU0, E500_SU1]>],
60 [5, 1, 1], // Latency = 1 or 2
62 E500_GPR_Bypass, E500_GPR_Bypass]>,
63 InstrItinData<IIC_IntDivW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
64 InstrStage<1, [E500_MU], 0>,
65 InstrStage<14, [E500_MU]>],
66 [17, 1, 1], // Latency=4..35, Repeat= 4..35
68 E500_GPR_Bypass, E500_GPR_Bypass]>,
69 InstrItinData<IIC_IntMulHW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
70 InstrStage<4, [E500_MU]>],
71 [7, 1, 1], // Latency = 4, Repeat rate = 1
73 E500_GPR_Bypass, E500_GPR_Bypass]>,
74 InstrItinData<IIC_IntMulHWU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
75 InstrStage<4, [E500_MU]>],
76 [7, 1, 1], // Latency = 4, Repeat rate = 1
78 E500_GPR_Bypass, E500_GPR_Bypass]>,
79 InstrItinData<IIC_IntMulLI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
80 InstrStage<4, [E500_MU]>],
81 [7, 1, 1], // Latency = 4, Repeat rate = 1
83 E500_GPR_Bypass, E500_GPR_Bypass]>,
84 InstrItinData<IIC_IntRotate, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
85 InstrStage<1, [E500_SU0, E500_SU1]>],
86 [4, 1, 1], // Latency = 1
88 E500_GPR_Bypass, E500_GPR_Bypass]>,
89 InstrItinData<IIC_IntShift, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
90 InstrStage<1, [E500_SU0, E500_SU1]>],
91 [4, 1, 1], // Latency = 1
93 E500_GPR_Bypass, E500_GPR_Bypass]>,
94 InstrItinData<IIC_IntTrapW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
95 InstrStage<2, [E500_SU0]>],
96 [5, 1], // Latency = 2, Repeat rate = 2
97 [E500_GPR_Bypass, E500_GPR_Bypass]>,
98 InstrItinData<IIC_BrB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
99 InstrStage<1, [E500_BU]>],
100 [4, 1], // Latency = 1
101 [NoBypass, E500_GPR_Bypass]>,
102 InstrItinData<IIC_BrCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
103 InstrStage<1, [E500_BU]>],
104 [4, 1, 1], // Latency = 1
106 E500_CR_Bypass, E500_CR_Bypass]>,
107 InstrItinData<IIC_BrMCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
108 InstrStage<1, [E500_BU]>],
109 [4, 1], // Latency = 1
110 [E500_CR_Bypass, E500_CR_Bypass]>,
111 InstrItinData<IIC_BrMCRX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
112 InstrStage<1, [E500_SU0, E500_SU1]>],
113 [4, 1, 1], // Latency = 1
114 [E500_CR_Bypass, E500_GPR_Bypass]>,
115 InstrItinData<IIC_LdStDCBA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
116 InstrStage<1, [E500_LSU_0]>],
117 [6, 1], // Latency = 3, Repeat rate = 1
118 [E500_GPR_Bypass, E500_GPR_Bypass]>,
119 InstrItinData<IIC_LdStDCBF, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
120 InstrStage<1, [E500_LSU_0]>],
121 [6, 1], // Latency = 3
122 [E500_GPR_Bypass, E500_GPR_Bypass]>,
123 InstrItinData<IIC_LdStDCBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
124 InstrStage<1, [E500_LSU_0]>],
125 [6, 1], // Latency = 3
126 [E500_GPR_Bypass, E500_GPR_Bypass]>,
127 InstrItinData<IIC_LdStLoad, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
128 InstrStage<1, [E500_LSU_0]>],
129 [6, 1], // Latency = 3
130 [E500_GPR_Bypass, E500_GPR_Bypass]>,
131 InstrItinData<IIC_LdStLoadUpd, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
132 InstrStage<1, [E500_SU0, E500_SU1], 0>,
133 InstrStage<1, [E500_LSU_0]>],
134 [6, 1], // Latency = 3
135 [E500_GPR_Bypass, E500_GPR_Bypass],
137 InstrItinData<IIC_LdStLoadUpdX,[InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
138 InstrStage<1, [E500_SU0, E500_SU1], 0>,
139 InstrStage<1, [E500_LSU_0]>],
140 [6, 1], // Latency = 3
141 [E500_GPR_Bypass, E500_GPR_Bypass],
143 InstrItinData<IIC_LdStStore, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
144 InstrStage<1, [E500_LSU_0]>],
145 [6, 1], // Latency = 3
146 [NoBypass, E500_GPR_Bypass]>,
147 InstrItinData<IIC_LdStSTU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
148 InstrStage<1, [E500_SU0, E500_SU1], 0>,
149 InstrStage<1, [E500_LSU_0]>],
150 [6, 1], // Latency = 3
151 [NoBypass, E500_GPR_Bypass],
153 InstrItinData<IIC_LdStSTUX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
154 InstrStage<1, [E500_SU0, E500_SU1], 0>,
155 InstrStage<1, [E500_LSU_0]>],
156 [6, 1], // Latency = 3
157 [NoBypass, E500_GPR_Bypass],
159 InstrItinData<IIC_LdStICBI, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
160 InstrStage<1, [E500_LSU_0]>],
161 [6, 1], // Latency = 3
162 [NoBypass, E500_GPR_Bypass]>,
163 InstrItinData<IIC_LdStLHA, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
164 InstrStage<1, [E500_LSU_0]>],
165 [6, 1], // Latency = 3
166 [E500_GPR_Bypass, E500_GPR_Bypass]>,
167 InstrItinData<IIC_LdStLHAU, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
168 InstrStage<1, [E500_SU0, E500_SU1], 0>,
169 InstrStage<1, [E500_LSU_0]>],
170 [6, 1], // Latency = 3
171 [E500_GPR_Bypass, E500_GPR_Bypass]>,
172 InstrItinData<IIC_LdStLHAUX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
173 InstrStage<1, [E500_SU0, E500_SU1], 0>,
174 InstrStage<1, [E500_LSU_0]>],
175 [6, 1], // Latency = 3
176 [E500_GPR_Bypass, E500_GPR_Bypass]>,
177 InstrItinData<IIC_LdStLMW, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
178 InstrStage<1, [E500_LSU_0]>],
179 [7, 1], // Latency = r+3
180 [NoBypass, E500_GPR_Bypass]>,
181 InstrItinData<IIC_LdStLWARX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
182 InstrStage<3, [E500_LSU_0]>],
183 [6, 1, 1], // Latency = 3, Repeat rate = 3
185 E500_GPR_Bypass, E500_GPR_Bypass]>,
186 InstrItinData<IIC_LdStSTWCX, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
187 InstrStage<1, [E500_LSU_0]>],
188 [6, 1], // Latency = 3
189 [NoBypass, E500_GPR_Bypass]>,
190 InstrItinData<IIC_LdStSync, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
191 InstrStage<1, [E500_LSU_0]>]>,
192 InstrItinData<IIC_SprMFSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
193 InstrStage<4, [E500_SU0]>],
195 [E500_GPR_Bypass, E500_GPR_Bypass]>,
196 InstrItinData<IIC_SprMTMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
197 InstrStage<2, [E500_SU0, E500_SU1]>],
198 [5, 1], // Latency = 2, Repeat rate = 4
199 [E500_GPR_Bypass, E500_GPR_Bypass]>,
200 InstrItinData<IIC_SprMTSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
201 InstrStage<1, [E500_SU0]>],
203 [NoBypass, E500_GPR_Bypass]>,
204 InstrItinData<IIC_SprTLBSYNC, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
205 InstrStage<1, [E500_LSU_0], 0>]>,
206 InstrItinData<IIC_SprMFCR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
207 InstrStage<5, [E500_SU0]>],
209 [E500_GPR_Bypass, E500_CR_Bypass]>,
210 InstrItinData<IIC_SprMFCRF, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
211 InstrStage<5, [E500_SU0]>],
213 [E500_GPR_Bypass, E500_CR_Bypass]>,
214 InstrItinData<IIC_SprMFPMR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
215 InstrStage<4, [E500_SU0]>],
216 [7, 1], // Latency = 4, Repeat rate = 4
217 [E500_GPR_Bypass, E500_GPR_Bypass]>,
218 InstrItinData<IIC_SprMFMSR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
219 InstrStage<4, [E500_SU0]>],
220 [7, 1], // Latency = 4, Repeat rate = 4
221 [E500_GPR_Bypass, E500_GPR_Bypass]>,
222 InstrItinData<IIC_SprMFSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
223 InstrStage<1, [E500_SU0, E500_SU1]>],
224 [4, 1], // Latency = 1, Repeat rate = 1
225 [E500_GPR_Bypass, E500_CR_Bypass]>,
226 InstrItinData<IIC_SprMTPMR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
227 InstrStage<1, [E500_SU0]>],
228 [4, 1], // Latency = 1, Repeat rate = 1
229 [E500_CR_Bypass, E500_GPR_Bypass]>,
230 InstrItinData<IIC_SprMFTB, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
231 InstrStage<4, [E500_SU0]>],
232 [7, 1], // Latency = 4, Repeat rate = 4
233 [NoBypass, E500_GPR_Bypass]>,
234 InstrItinData<IIC_SprMTSPR, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
235 InstrStage<1, [E500_SU0, E500_SU1]>],
236 [4, 1], // Latency = 1, Repeat rate = 1
237 [E500_CR_Bypass, E500_GPR_Bypass]>,
238 InstrItinData<IIC_SprMTSRIN, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
239 InstrStage<1, [E500_SU0]>],
241 [NoBypass, E500_GPR_Bypass]>,
242 InstrItinData<IIC_FPDGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
243 InstrStage<6, [E500_MU]>],
244 [9, 1, 1], // Latency = 6, Repeat rate = 1
246 InstrItinData<IIC_FPSGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
247 InstrStage<4, [E500_MU]>],
248 [7, 1, 1], // Latency = 4, Repeat rate = 1
250 InstrItinData<IIC_FPDivD, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
251 InstrStage<32, [E500_MU]>],
252 [35, 1, 1], // Latency = 32, Repeat rate = 32
254 InstrItinData<IIC_FPDivS, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
255 InstrStage<29, [E500_MU]>],
256 [32, 1, 1], // Latency = 29, Repeat rate = 29
258 InstrItinData<IIC_VecGeneral, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
259 InstrStage<1, [E500_SU0]>],
260 [4, 1, 1], // Latency = 1, Repeat rate = 1
262 InstrItinData<IIC_VecComplex, [InstrStage<1, [E500_DIS0, E500_DIS1], 0>,
263 InstrStage<4, [E500_MU]>],
264 [7, 1, 1], // Latency = 4, Repeat rate = 1
268 // ===---------------------------------------------------------------------===//
269 // e500 machine model for scheduling and other instruction cost heuristics.
271 def PPCE500Model : SchedMachineModel {
272 let IssueWidth = 2; // 2 micro-ops are dispatched per cycle.
273 let LoadLatency = 5; // Optimistic load latency assuming bypass.
274 // This is overridden by OperandCycles if the
275 // Itineraries are queried instead.
277 let CompleteModel = 0;
279 let Itineraries = PPCE500Itineraries;