xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64SchedA57.td (revision 0c428864495af9dc7d2af4d0a5ae21732af9c739)
1//=- AArch64SchedA57.td - ARM Cortex-A57 Scheduling Defs -----*- tablegen -*-=//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the machine model for ARM Cortex-A57 to support
10// instruction scheduling and other instruction cost heuristics.
11//
12//===----------------------------------------------------------------------===//
13
14//===----------------------------------------------------------------------===//
15// The Cortex-A57 is a traditional superscalar microprocessor with a
16// conservative 3-wide in-order stage for decode and dispatch. Combined with the
17// much wider out-of-order issue stage, this produced a need to carefully
18// schedule micro-ops so that all three decoded each cycle are successfully
19// issued as the reservation station(s) simply don't stay occupied for long.
20// Therefore, IssueWidth is set to the narrower of the two at three, while still
21// modeling the machine as out-of-order.
22
23def CortexA57Model : SchedMachineModel {
24  let IssueWidth        =   3; // 3-way decode and dispatch
25  let MicroOpBufferSize = 128; // 128 micro-op re-order buffer
26  let LoadLatency       =   4; // Optimistic load latency
27  let MispredictPenalty =  14; // Fetch + Decode/Rename/Dispatch + Branch
28
29  // Enable partial & runtime unrolling. The magic number is chosen based on
30  // experiments and benchmarking data.
31  let LoopMicroOpBufferSize = 16;
32  let CompleteModel = 1;
33
34  list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F,
35                                                    PAUnsupported.F,
36                                                    SMEUnsupported.F,
37                                                    [HasMTE]);
38}
39
40//===----------------------------------------------------------------------===//
41// Define each kind of processor resource and number available on Cortex-A57.
42// Cortex A-57 has 8 pipelines that each has its own 8-entry queue where
43// micro-ops wait for their operands and then issue out-of-order.
44
45def A57UnitB : ProcResource<1>;  // Type B micro-ops
46def A57UnitI : ProcResource<2>;  // Type I micro-ops
47def A57UnitM : ProcResource<1>;  // Type M micro-ops
48def A57UnitL : ProcResource<1>;  // Type L micro-ops
49def A57UnitS : ProcResource<1>;  // Type S micro-ops
50def A57UnitX : ProcResource<1>;  // Type X micro-ops
51def A57UnitW : ProcResource<1>;  // Type W micro-ops
52let SchedModel = CortexA57Model in {
53  def A57UnitV : ProcResGroup<[A57UnitX, A57UnitW]>;    // Type V micro-ops
54}
55
56let SchedModel = CortexA57Model in {
57
58//===----------------------------------------------------------------------===//
59// Define customized scheduler read/write types specific to the Cortex-A57.
60
61include "AArch64SchedA57WriteRes.td"
62
63//===----------------------------------------------------------------------===//
64// Map the target-defined scheduler read/write resources and latency for
65// Cortex-A57. The Cortex-A57 types are directly associated with resources, so
66// defining the aliases precludes the need for mapping them using WriteRes. The
67// aliases are sufficient for creating a coarse, working model. As the model
68// evolves, InstRWs will be used to override some of these SchedAliases.
69//
70// WARNING: Using SchedAliases is convenient and works well for latency and
71//          resource lookup for instructions. However, this creates an entry in
72//          AArch64WriteLatencyTable with a WriteResourceID of 0, breaking
73//          any SchedReadAdvance since the lookup will fail.
74
75def : SchedAlias<WriteImm,   A57Write_1cyc_1I>;
76def : SchedAlias<WriteI,     A57Write_1cyc_1I>;
77def : SchedAlias<WriteISReg, A57Write_2cyc_1M>;
78def : SchedAlias<WriteIEReg, A57Write_2cyc_1M>;
79def : SchedAlias<WriteExtr,  A57Write_1cyc_1I>;
80def : SchedAlias<WriteIS,    A57Write_1cyc_1I>;
81def : SchedAlias<WriteID32,  A57Write_19cyc_1M>;
82def : SchedAlias<WriteID64,  A57Write_35cyc_1M>;
83def : WriteRes<WriteIM32, [A57UnitM]> { let Latency = 3; }
84def : WriteRes<WriteIM64, [A57UnitM]> { let Latency = 5; }
85def : SchedAlias<WriteBr,    A57Write_1cyc_1B>;
86def : SchedAlias<WriteBrReg, A57Write_1cyc_1B>;
87def : SchedAlias<WriteLD,    A57Write_4cyc_1L>;
88def : SchedAlias<WriteST,    A57Write_1cyc_1S>;
89def : SchedAlias<WriteSTP,   A57Write_1cyc_1S>;
90def : SchedAlias<WriteAdr,   A57Write_1cyc_1I>;
91def : SchedAlias<WriteLDIdx, A57Write_4cyc_1I_1L>;
92def : SchedAlias<WriteSTIdx, A57Write_1cyc_1I_1S>;
93def : SchedAlias<WriteF,     A57Write_3cyc_1V>;
94def : SchedAlias<WriteFCmp,  A57Write_3cyc_1V>;
95def : SchedAlias<WriteFCvt,  A57Write_5cyc_1V>;
96def : SchedAlias<WriteFCopy, A57Write_5cyc_1L>;
97def : SchedAlias<WriteFImm,  A57Write_3cyc_1V>;
98def : WriteRes<WriteFMul, [A57UnitV]> { let Latency = 5;}
99def : SchedAlias<WriteFDiv,  A57Write_17cyc_1W>;
100def : SchedAlias<WriteVd,    A57Write_3cyc_1V>;
101def : SchedAlias<WriteVq,    A57Write_3cyc_1V>;
102def : SchedAlias<WriteVLD,   A57Write_5cyc_1L>;
103def : SchedAlias<WriteVST,   A57Write_1cyc_1S>;
104
105def : WriteRes<WriteAtomic,  []> { let Unsupported = 1; }
106
107def : WriteRes<WriteSys,     []> { let Latency = 1; }
108def : WriteRes<WriteBarrier, []> { let Latency = 1; }
109def : WriteRes<WriteHint,    []> { let Latency = 1; }
110
111def : WriteRes<WriteLDHi,    []> { let Latency = 4; }
112
113// Forwarding logic is only modeled for multiply and accumulate
114def : ReadAdvance<ReadI,       0>;
115def : ReadAdvance<ReadISReg,   0>;
116def : ReadAdvance<ReadIEReg,   0>;
117def : ReadAdvance<ReadIM,      0>;
118def : ReadAdvance<ReadIMA,     2, [WriteIM32, WriteIM64]>;
119def : ReadAdvance<ReadID,      0>;
120def : ReadAdvance<ReadExtrHi,  0>;
121def : ReadAdvance<ReadST,      0>;
122def : ReadAdvance<ReadAdrBase, 0>;
123def : ReadAdvance<ReadVLD,     0>;
124
125
126//===----------------------------------------------------------------------===//
127// Specialize the coarse model by associating instruction groups with the
128// subtarget-defined types. As the modeled is refined, this will override most
129// of the above ShchedAlias mappings.
130
131// Miscellaneous
132// -----------------------------------------------------------------------------
133
134def : InstRW<[WriteI], (instrs COPY)>;
135
136
137// Branch Instructions
138// -----------------------------------------------------------------------------
139
140def : InstRW<[A57Write_1cyc_1B_1I], (instrs BL)>;
141def : InstRW<[A57Write_2cyc_1B_1I], (instrs BLR)>;
142
143
144// Shifted Register with Shift == 0
145// ----------------------------------------------------------------------------
146
147def A57WriteISReg : SchedWriteVariant<[
148       SchedVar<RegShiftedPred, [WriteISReg]>,
149       SchedVar<NoSchedPred, [WriteI]>]>;
150def : InstRW<[A57WriteISReg], (instregex ".*rs$")>;
151
152
153// Divide and Multiply Instructions
154// -----------------------------------------------------------------------------
155
156// Multiply high
157def : InstRW<[A57Write_6cyc_1M], (instrs SMULHrr, UMULHrr)>;
158
159
160// Miscellaneous Data-Processing Instructions
161// -----------------------------------------------------------------------------
162
163def : InstRW<[A57Write_1cyc_1I],    (instrs EXTRWrri)>;
164def : InstRW<[A57Write_3cyc_1I_1M], (instrs EXTRXrri)>;
165def : InstRW<[A57Write_2cyc_1M],    (instregex "BFM")>;
166
167
168// Cryptography Extensions
169// -----------------------------------------------------------------------------
170
171def A57ReadAES  : SchedReadAdvance<3, [A57Write_3cyc_1W]>;
172def : InstRW<[A57Write_3cyc_1W], (instregex "^AES[DE]")>;
173def : InstRW<[A57Write_3cyc_1W, A57ReadAES], (instregex "^AESI?MC")>;
174def : InstRW<[A57Write_6cyc_2V], (instregex "^SHA1SU0")>;
175def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA1(H|SU1)")>;
176def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA1[CMP]")>;
177def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA256SU0")>;
178def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA256(H|H2|SU1)")>;
179def : InstRW<[A57Write_3cyc_1W], (instregex "^CRC32")>;
180
181
182// Vector Load
183// -----------------------------------------------------------------------------
184
185def : InstRW<[A57Write_8cyc_1L_1V],           (instregex "LD1i(8|16|32)$")>;
186def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1i(8|16|32)_POST$")>;
187def : InstRW<[A57Write_5cyc_1L],            (instregex "LD1i(64)$")>;
188def : InstRW<[A57Write_5cyc_1L, WriteAdr],  (instregex "LD1i(64)_POST$")>;
189
190def : InstRW<[A57Write_8cyc_1L_1V],           (instregex "LD1Rv(8b|4h|2s)$")>;
191def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1Rv(8b|4h|2s)_POST$")>;
192def : InstRW<[A57Write_5cyc_1L],            (instregex "LD1Rv(1d)$")>;
193def : InstRW<[A57Write_5cyc_1L, WriteAdr],  (instregex "LD1Rv(1d)_POST$")>;
194def : InstRW<[A57Write_8cyc_1L_1V],           (instregex "LD1Rv(16b|8h|4s|2d)$")>;
195def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr], (instregex "LD1Rv(16b|8h|4s|2d)_POST$")>;
196
197def : InstRW<[A57Write_5cyc_1L],              (instregex "LD1Onev(8b|4h|2s|1d)$")>;
198def : InstRW<[A57Write_5cyc_1L, WriteAdr],    (instregex "LD1Onev(8b|4h|2s|1d)_POST$")>;
199def : InstRW<[A57Write_5cyc_1L],              (instregex "LD1Onev(16b|8h|4s|2d)$")>;
200def : InstRW<[A57Write_5cyc_1L, WriteAdr],    (instregex "LD1Onev(16b|8h|4s|2d)_POST$")>;
201def : InstRW<[A57Write_5cyc_1L],              (instregex "LD1Twov(8b|4h|2s|1d)$")>;
202def : InstRW<[A57Write_5cyc_1L, WriteAdr],    (instregex "LD1Twov(8b|4h|2s|1d)_POST$")>;
203def : InstRW<[A57Write_6cyc_2L],             (instregex "LD1Twov(16b|8h|4s|2d)$")>;
204def : InstRW<[A57Write_6cyc_2L, WriteAdr],   (instregex "LD1Twov(16b|8h|4s|2d)_POST$")>;
205def : InstRW<[A57Write_6cyc_2L],             (instregex "LD1Threev(8b|4h|2s|1d)$")>;
206def : InstRW<[A57Write_6cyc_2L, WriteAdr],   (instregex "LD1Threev(8b|4h|2s|1d)_POST$")>;
207def : InstRW<[A57Write_7cyc_3L],            (instregex "LD1Threev(16b|8h|4s|2d)$")>;
208def : InstRW<[A57Write_7cyc_3L, WriteAdr],  (instregex "LD1Threev(16b|8h|4s|2d)_POST$")>;
209def : InstRW<[A57Write_6cyc_2L],             (instregex "LD1Fourv(8b|4h|2s|1d)$")>;
210def : InstRW<[A57Write_6cyc_2L, WriteAdr],   (instregex "LD1Fourv(8b|4h|2s|1d)_POST$")>;
211def : InstRW<[A57Write_8cyc_4L],           (instregex "LD1Fourv(16b|8h|4s|2d)$")>;
212def : InstRW<[A57Write_8cyc_4L, WriteAdr], (instregex "LD1Fourv(16b|8h|4s|2d)_POST$")>;
213
214def : InstRW<[A57Write_8cyc_1L_2V],           (instregex "LD2i(8|16)$")>;
215def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD2i(8|16)_POST$")>;
216def : InstRW<[A57Write_6cyc_2L],            (instregex "LD2i(32)$")>;
217def : InstRW<[A57Write_6cyc_2L, WriteAdr],  (instregex "LD2i(32)_POST$")>;
218def : InstRW<[A57Write_8cyc_1L_1V],            (instregex "LD2i(64)$")>;
219def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr],  (instregex "LD2i(64)_POST$")>;
220
221def : InstRW<[A57Write_8cyc_1L_1V],            (instregex "LD2Rv(8b|4h|2s)$")>;
222def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr],  (instregex "LD2Rv(8b|4h|2s)_POST$")>;
223def : InstRW<[A57Write_5cyc_1L],             (instregex "LD2Rv(1d)$")>;
224def : InstRW<[A57Write_5cyc_1L, WriteAdr],   (instregex "LD2Rv(1d)_POST$")>;
225def : InstRW<[A57Write_8cyc_1L_2V],           (instregex "LD2Rv(16b|8h|4s|2d)$")>;
226def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr], (instregex "LD2Rv(16b|8h|4s|2d)_POST$")>;
227
228def : InstRW<[A57Write_8cyc_1L_1V],             (instregex "LD2Twov(8b|4h|2s)$")>;
229def : InstRW<[A57Write_8cyc_1L_1V, WriteAdr],   (instregex "LD2Twov(8b|4h|2s)_POST$")>;
230def : InstRW<[A57Write_9cyc_2L_2V],           (instregex "LD2Twov(16b|8h|4s)$")>;
231def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr], (instregex "LD2Twov(16b|8h|4s)_POST$")>;
232def : InstRW<[A57Write_6cyc_2L],             (instregex "LD2Twov(2d)$")>;
233def : InstRW<[A57Write_6cyc_2L, WriteAdr],   (instregex "LD2Twov(2d)_POST$")>;
234
235def : InstRW<[A57Write_9cyc_1L_3V],           (instregex "LD3i(8|16)$")>;
236def : InstRW<[A57Write_9cyc_1L_3V, WriteAdr], (instregex "LD3i(8|16)_POST$")>;
237def : InstRW<[A57Write_8cyc_1L_2V],            (instregex "LD3i(32)$")>;
238def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr],  (instregex "LD3i(32)_POST$")>;
239def : InstRW<[A57Write_6cyc_2L],             (instregex "LD3i(64)$")>;
240def : InstRW<[A57Write_6cyc_2L, WriteAdr],   (instregex "LD3i(64)_POST$")>;
241
242def : InstRW<[A57Write_8cyc_1L_2V],             (instregex "LD3Rv(8b|4h|2s)$")>;
243def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr],   (instregex "LD3Rv(8b|4h|2s)_POST$")>;
244def : InstRW<[A57Write_6cyc_2L],              (instregex "LD3Rv(1d)$")>;
245def : InstRW<[A57Write_6cyc_2L, WriteAdr],    (instregex "LD3Rv(1d)_POST$")>;
246def : InstRW<[A57Write_9cyc_1L_3V],            (instregex "LD3Rv(16b|8h|4s)$")>;
247def : InstRW<[A57Write_9cyc_1L_3V, WriteAdr],  (instregex "LD3Rv(16b|8h|4s)_POST$")>;
248def : InstRW<[A57Write_9cyc_2L_3V],           (instregex "LD3Rv(2d)$")>;
249def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD3Rv(2d)_POST$")>;
250
251def : InstRW<[A57Write_9cyc_2L_2V],               (instregex "LD3Threev(8b|4h|2s)$")>;
252def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr],     (instregex "LD3Threev(8b|4h|2s)_POST$")>;
253def : InstRW<[A57Write_10cyc_3L_4V],           (instregex "LD3Threev(16b|8h|4s)$")>;
254def : InstRW<[A57Write_10cyc_3L_4V, WriteAdr], (instregex "LD3Threev(16b|8h|4s)_POST$")>;
255def : InstRW<[A57Write_8cyc_4L],               (instregex "LD3Threev(2d)$")>;
256def : InstRW<[A57Write_8cyc_4L, WriteAdr],     (instregex "LD3Threev(2d)_POST$")>;
257
258def : InstRW<[A57Write_9cyc_2L_3V],           (instregex "LD4i(8|16)$")>;
259def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD4i(8|16)_POST$")>;
260def : InstRW<[A57Write_8cyc_1L_2V],             (instregex "LD4i(32)$")>;
261def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr],   (instregex "LD4i(32)_POST$")>;
262def : InstRW<[A57Write_9cyc_2L_3V],           (instregex "LD4i(64)$")>;
263def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr], (instregex "LD4i(64)_POST$")>;
264
265def : InstRW<[A57Write_8cyc_1L_2V],              (instregex "LD4Rv(8b|4h|2s)$")>;
266def : InstRW<[A57Write_8cyc_1L_2V, WriteAdr],    (instregex "LD4Rv(8b|4h|2s)_POST$")>;
267def : InstRW<[A57Write_6cyc_2L],               (instregex "LD4Rv(1d)$")>;
268def : InstRW<[A57Write_6cyc_2L, WriteAdr],     (instregex "LD4Rv(1d)_POST$")>;
269def : InstRW<[A57Write_9cyc_2L_3V],            (instregex "LD4Rv(16b|8h|4s)$")>;
270def : InstRW<[A57Write_9cyc_2L_3V, WriteAdr],  (instregex "LD4Rv(16b|8h|4s)_POST$")>;
271def : InstRW<[A57Write_9cyc_2L_4V],           (instregex "LD4Rv(2d)$")>;
272def : InstRW<[A57Write_9cyc_2L_4V, WriteAdr], (instregex "LD4Rv(2d)_POST$")>;
273
274def : InstRW<[A57Write_9cyc_2L_2V],                (instregex "LD4Fourv(8b|4h|2s)$")>;
275def : InstRW<[A57Write_9cyc_2L_2V, WriteAdr],      (instregex "LD4Fourv(8b|4h|2s)_POST$")>;
276def : InstRW<[A57Write_11cyc_4L_4V],           (instregex "LD4Fourv(16b|8h|4s)$")>;
277def : InstRW<[A57Write_11cyc_4L_4V, WriteAdr], (instregex "LD4Fourv(16b|8h|4s)_POST$")>;
278def : InstRW<[A57Write_8cyc_4L],                (instregex "LD4Fourv(2d)$")>;
279def : InstRW<[A57Write_8cyc_4L, WriteAdr],      (instregex "LD4Fourv(2d)_POST$")>;
280
281// Vector Store
282// -----------------------------------------------------------------------------
283
284def : InstRW<[A57Write_1cyc_1S],            (instregex "ST1i(8|16|32)$")>;
285def : InstRW<[A57Write_1cyc_1S, WriteAdr],  (instregex "ST1i(8|16|32)_POST$")>;
286def : InstRW<[A57Write_3cyc_1S_1V],           (instregex "ST1i(64)$")>;
287def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST1i(64)_POST$")>;
288
289def : InstRW<[A57Write_1cyc_1S],                  (instregex "ST1Onev(8b|4h|2s|1d)$")>;
290def : InstRW<[A57Write_1cyc_1S, WriteAdr],        (instregex "ST1Onev(8b|4h|2s|1d)_POST$")>;
291def : InstRW<[A57Write_2cyc_2S],                 (instregex "ST1Onev(16b|8h|4s|2d)$")>;
292def : InstRW<[A57Write_2cyc_2S, WriteAdr],       (instregex "ST1Onev(16b|8h|4s|2d)_POST$")>;
293def : InstRW<[A57Write_2cyc_2S],                 (instregex "ST1Twov(8b|4h|2s|1d)$")>;
294def : InstRW<[A57Write_2cyc_2S, WriteAdr],       (instregex "ST1Twov(8b|4h|2s|1d)_POST$")>;
295def : InstRW<[A57Write_4cyc_4S],               (instregex "ST1Twov(16b|8h|4s|2d)$")>;
296def : InstRW<[A57Write_4cyc_4S, WriteAdr],     (instregex "ST1Twov(16b|8h|4s|2d)_POST$")>;
297def : InstRW<[A57Write_3cyc_3S],                (instregex "ST1Threev(8b|4h|2s|1d)$")>;
298def : InstRW<[A57Write_3cyc_3S, WriteAdr],      (instregex "ST1Threev(8b|4h|2s|1d)_POST$")>;
299def : InstRW<[A57Write_6cyc_6S],             (instregex "ST1Threev(16b|8h|4s|2d)$")>;
300def : InstRW<[A57Write_6cyc_6S, WriteAdr],   (instregex "ST1Threev(16b|8h|4s|2d)_POST$")>;
301def : InstRW<[A57Write_4cyc_4S],               (instregex "ST1Fourv(8b|4h|2s|1d)$")>;
302def : InstRW<[A57Write_4cyc_4S, WriteAdr],     (instregex "ST1Fourv(8b|4h|2s|1d)_POST$")>;
303def : InstRW<[A57Write_8cyc_8S],           (instregex "ST1Fourv(16b|8h|4s|2d)$")>;
304def : InstRW<[A57Write_8cyc_8S, WriteAdr], (instregex "ST1Fourv(16b|8h|4s|2d)_POST$")>;
305
306def : InstRW<[A57Write_3cyc_1S_1V],           (instregex "ST2i(8|16|32)$")>;
307def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr], (instregex "ST2i(8|16|32)_POST$")>;
308def : InstRW<[A57Write_2cyc_2S],           (instregex "ST2i(64)$")>;
309def : InstRW<[A57Write_2cyc_2S, WriteAdr], (instregex "ST2i(64)_POST$")>;
310
311def : InstRW<[A57Write_3cyc_2S_1V],              (instregex "ST2Twov(8b|4h|2s)$")>;
312def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr],    (instregex "ST2Twov(8b|4h|2s)_POST$")>;
313def : InstRW<[A57Write_4cyc_4S_2V],           (instregex "ST2Twov(16b|8h|4s)$")>;
314def : InstRW<[A57Write_4cyc_4S_2V, WriteAdr], (instregex "ST2Twov(16b|8h|4s)_POST$")>;
315def : InstRW<[A57Write_4cyc_4S],             (instregex "ST2Twov(2d)$")>;
316def : InstRW<[A57Write_4cyc_4S, WriteAdr],   (instregex "ST2Twov(2d)_POST$")>;
317
318def : InstRW<[A57Write_3cyc_1S_1V],            (instregex "ST3i(8|16)$")>;
319def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr],  (instregex "ST3i(8|16)_POST$")>;
320def : InstRW<[A57Write_3cyc_3S],           (instregex "ST3i(32)$")>;
321def : InstRW<[A57Write_3cyc_3S, WriteAdr], (instregex "ST3i(32)_POST$")>;
322def : InstRW<[A57Write_3cyc_2S_1V],           (instregex "ST3i(64)$")>;
323def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr], (instregex "ST3i(64)_POST$")>;
324
325def : InstRW<[A57Write_3cyc_3S_2V],                 (instregex "ST3Threev(8b|4h|2s)$")>;
326def : InstRW<[A57Write_3cyc_3S_2V, WriteAdr],       (instregex "ST3Threev(8b|4h|2s)_POST$")>;
327def : InstRW<[A57Write_6cyc_6S_4V],           (instregex "ST3Threev(16b|8h|4s)$")>;
328def : InstRW<[A57Write_6cyc_6S_4V, WriteAdr], (instregex "ST3Threev(16b|8h|4s)_POST$")>;
329def : InstRW<[A57Write_6cyc_6S],                (instregex "ST3Threev(2d)$")>;
330def : InstRW<[A57Write_6cyc_6S, WriteAdr],      (instregex "ST3Threev(2d)_POST$")>;
331
332def : InstRW<[A57Write_3cyc_1S_1V],             (instregex "ST4i(8|16)$")>;
333def : InstRW<[A57Write_3cyc_1S_1V, WriteAdr],   (instregex "ST4i(8|16)_POST$")>;
334def : InstRW<[A57Write_4cyc_4S],           (instregex "ST4i(32)$")>;
335def : InstRW<[A57Write_4cyc_4S, WriteAdr], (instregex "ST4i(32)_POST$")>;
336def : InstRW<[A57Write_3cyc_2S_1V],            (instregex "ST4i(64)$")>;
337def : InstRW<[A57Write_3cyc_2S_1V, WriteAdr],  (instregex "ST4i(64)_POST$")>;
338
339def : InstRW<[A57Write_4cyc_4S_2V],                  (instregex "ST4Fourv(8b|4h|2s)$")>;
340def : InstRW<[A57Write_4cyc_4S_2V, WriteAdr],        (instregex "ST4Fourv(8b|4h|2s)_POST$")>;
341def : InstRW<[A57Write_8cyc_8S_4V],           (instregex "ST4Fourv(16b|8h|4s)$")>;
342def : InstRW<[A57Write_8cyc_8S_4V, WriteAdr], (instregex "ST4Fourv(16b|8h|4s)_POST$")>;
343def : InstRW<[A57Write_8cyc_8S],                (instregex "ST4Fourv(2d)$")>;
344def : InstRW<[A57Write_8cyc_8S, WriteAdr],      (instregex "ST4Fourv(2d)_POST$")>;
345
346// Vector - Integer
347// -----------------------------------------------------------------------------
348
349// Reference for forms in this group
350//   D form - v8i8, v4i16, v2i32
351//   Q form - v16i8, v8i16, v4i32
352//   D form - v1i8, v1i16, v1i32, v1i64
353//   Q form - v16i8, v8i16, v4i32, v2i64
354//   D form - v8i8_v8i16, v4i16_v4i32, v2i32_v2i64
355//   Q form - v16i8_v8i16, v8i16_v4i32, v4i32_v2i64
356
357// Cortex A57 Software Optimization Guide Sec 3.14
358// Advance for absolute diff accum, pairwise add and accumulate, shift accumulate
359def A57ReadIVA3 : SchedReadAdvance<3, [A57Write_4cyc_1X_NonMul_Forward, A57Write_5cyc_2X_NonMul_Forward]>;
360
361// ASIMD absolute diff accum, D-form
362def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>;
363// ASIMD absolute diff accum, Q-form
364def : InstRW<[A57Write_5cyc_2X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>;
365// ASIMD absolute diff accum long
366def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABAL")>;
367
368// ASIMD arith, reduce, 4H/4S
369def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>;
370// ASIMD arith, reduce, 8B/8H
371def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>;
372// ASIMD arith, reduce, 16B
373def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU]?ADDL?Vv16i8v$")>;
374
375// ASIMD max/min, reduce, 4H/4S
376def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>;
377// ASIMD max/min, reduce, 8B/8H
378def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>;
379// ASIMD max/min, reduce, 16B
380def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU](MIN|MAX)Vv16i8v$")>;
381
382// ASIMD multiply, D-form
383// MUL
384def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^MUL(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
385// PMUL, SQDMULH, SQRDMULH
386def : InstRW<[A57Write_5cyc_1W], (instregex "^(PMUL|SQR?DMULH)(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
387
388// ASIMD multiply, Q-form
389// MUL
390def : InstRW<[A57Write_6cyc_2W_Mul_Forward], (instregex "^MUL(v16i8|v8i16|v4i32)(_indexed)?$")>;
391// PMUL, SQDMULH, SQRDMULH
392def : InstRW<[A57Write_6cyc_2W], (instregex "^(PMUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>;
393
394// Cortex A57 Software Optimization Guide Sec 3.14
395def A57ReadIVMA4   : SchedReadAdvance<4 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
396def A57ReadIVMA3   : SchedReadAdvance<3 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
397
398// ASIMD multiply accumulate, D-form
399def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>;
400// ASIMD multiply accumulate, Q-form
401def : InstRW<[A57Write_6cyc_2W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>;
402
403// ASIMD multiply accumulate long
404// ASIMD multiply accumulate saturating long
405def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^(S|U)ML[AS]L")>;
406def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA3], (instregex "^SQDML[AS]L")>;
407
408// ASIMD multiply long
409def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^(S|U)MULL")>;
410def : InstRW<[A57Write_5cyc_1W], (instregex "^SQDMULL")>;
411def : InstRW<[A57Write_5cyc_1W], (instregex "^PMULL(v8i8|v16i8)")>;
412def : InstRW<[A57Write_3cyc_1W], (instregex "^PMULL(v1i64|v2i64)")>;
413
414// ASIMD pairwise add and accumulate
415// ASIMD shift accumulate
416def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ADALP")>;
417def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^(S|SR|U|UR)SRA")>;
418
419// ASIMD shift by immed, complex
420def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?(Q|R){1,2}SHR")>;
421def : InstRW<[A57Write_4cyc_1X], (instregex "^SQSHLU")>;
422
423
424// ASIMD shift by register, basic, Q-form
425def : InstRW<[A57Write_4cyc_2X], (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>;
426
427// ASIMD shift by register, complex, D-form
428def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU][QR]{1,2}SHL(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>;
429
430// ASIMD shift by register, complex, Q-form
431def : InstRW<[A57Write_5cyc_2X], (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>;
432
433
434// Vector - Floating Point
435// -----------------------------------------------------------------------------
436
437// Reference for forms in this group
438//   D form - v2f32
439//   Q form - v4f32, v2f64
440//   D form - 32, 64
441//   D form - v1i32, v1i64
442//   D form - v2i32
443//   Q form - v4i32, v2i64
444
445// ASIMD FP arith, normal, D-form
446def : InstRW<[A57Write_5cyc_1V], (instregex "^(FABD|FADD|FSUB)(v2f32|32|64|v2i32p)")>;
447// ASIMD FP arith, normal, Q-form
448def : InstRW<[A57Write_5cyc_2V], (instregex "^(FABD|FADD|FSUB)(v4f32|v2f64|v2i64p)")>;
449
450// ASIMD FP arith, pairwise, D-form
451def : InstRW<[A57Write_5cyc_1V], (instregex "^FADDP(v2f32|32|64|v2i32)")>;
452// ASIMD FP arith, pairwise, Q-form
453def : InstRW<[A57Write_9cyc_3V], (instregex "^FADDP(v4f32|v2f64|v2i64)")>;
454
455// ASIMD FP compare, D-form
456def : InstRW<[A57Write_5cyc_1V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v2f32|32|64|v1i32|v2i32|v1i64)")>;
457// ASIMD FP compare, Q-form
458def : InstRW<[A57Write_5cyc_2V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v4f32|v2f64|v4i32|v2i64)")>;
459
460// ASIMD FP convert, long and narrow
461def : InstRW<[A57Write_8cyc_3V], (instregex "^FCVT(L|N|XN)v")>;
462// ASIMD FP convert, other, D-form
463def : InstRW<[A57Write_5cyc_1V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>;
464// ASIMD FP convert, other, Q-form
465def : InstRW<[A57Write_5cyc_2V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>;
466
467// ASIMD FP divide, D-form, F32
468def : InstRW<[A57Write_17cyc_1W], (instregex "FDIVv2f32")>;
469// ASIMD FP divide, Q-form, F32
470def : InstRW<[A57Write_34cyc_2W], (instregex "FDIVv4f32")>;
471// ASIMD FP divide, Q-form, F64
472def : InstRW<[A57Write_64cyc_2W], (instregex "FDIVv2f64")>;
473
474// Note: These were simply duplicated from ASIMD FDIV because of missing documentation
475// ASIMD FP square root, D-form, F32
476def : InstRW<[A57Write_17cyc_1W], (instregex "FSQRTv2f32")>;
477// ASIMD FP square root, Q-form, F32
478def : InstRW<[A57Write_34cyc_2W], (instregex "FSQRTv4f32")>;
479// ASIMD FP square root, Q-form, F64
480def : InstRW<[A57Write_64cyc_2W], (instregex "FSQRTv2f64")>;
481
482// ASIMD FP max/min, normal, D-form
483def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?(v2f32)")>;
484// ASIMD FP max/min, normal, Q-form
485def : InstRW<[A57Write_5cyc_2V], (instregex "^(FMAX|FMIN)(NM)?(v4f32|v2f64)")>;
486// ASIMD FP max/min, pairwise, D-form
487def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?P(v2f32|v2i32)")>;
488// ASIMD FP max/min, pairwise, Q-form
489def : InstRW<[A57Write_9cyc_3V], (instregex "^(FMAX|FMIN)(NM)?P(v4f32|v2f64|v2i64)")>;
490// ASIMD FP max/min, reduce
491def : InstRW<[A57Write_10cyc_3V], (instregex "^(FMAX|FMIN)(NM)?Vv")>;
492
493// ASIMD FP multiply, D-form, FZ
494def : InstRW<[A57Write_5cyc_1V_FP_Forward], (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>;
495// ASIMD FP multiply, Q-form, FZ
496def : InstRW<[A57Write_5cyc_2V_FP_Forward], (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>;
497
498// ASIMD FP multiply accumulate, D-form, FZ
499// ASIMD FP multiply accumulate, Q-form, FZ
500def A57WriteFPVMAD : SchedWriteRes<[A57UnitV]> { let Latency = 9;  }
501def A57WriteFPVMAQ : SchedWriteRes<[A57UnitV, A57UnitV]> { let Latency = 10;  }
502
503// Cortex A57 Software Optimization Guide Sec 3.15
504// Advances from FP mul and mul-accum to mul-accum
505def A57ReadFPVMA5  : SchedReadAdvance<5, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
506def A57ReadFPVMA6  : SchedReadAdvance<6, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
507
508def : InstRW<[A57WriteFPVMAD, A57ReadFPVMA5], (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>;
509def : InstRW<[A57WriteFPVMAQ, A57ReadFPVMA6], (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>;
510
511// ASIMD FP round, D-form
512def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT[AIMNPXZ](v2f32)")>;
513// ASIMD FP round, Q-form
514def : InstRW<[A57Write_5cyc_2V], (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>;
515
516
517// Vector - Miscellaneous
518// -----------------------------------------------------------------------------
519
520// Reference for forms in this group
521//   D form - v8i8, v4i16, v2i32
522//   Q form - v16i8, v8i16, v4i32
523//   D form - v1i8, v1i16, v1i32, v1i64
524//   Q form - v16i8, v8i16, v4i32, v2i64
525
526// ASIMD bitwise insert, Q-form
527def : InstRW<[A57Write_3cyc_2V], (instregex "^(BIF|BIT|BSL|BSP)v16i8")>;
528
529// ASIMD duplicate, gen reg, D-form and Q-form
530def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUP(i8|i16|i32|i64)$")>;
531def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUPv.+gpr")>;
532
533// ASIMD move, saturating
534def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]QXTU?N")>;
535
536// ASIMD reciprocal estimate, D-form
537def : InstRW<[A57Write_5cyc_1V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f32|v1i32|v2i32|v1i64)")>;
538// ASIMD reciprocal estimate, Q-form
539def : InstRW<[A57Write_5cyc_2V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f64|v4f32|v4i32)")>;
540
541// ASIMD reciprocal step, D-form, FZ
542def : InstRW<[A57Write_9cyc_1V], (instregex "^F(RECP|RSQRT)S(v2f32|v1i32|v2i32|v1i64|32|64)")>;
543// ASIMD reciprocal step, Q-form, FZ
544def : InstRW<[A57Write_9cyc_2V], (instregex "^F(RECP|RSQRT)S(v2f64|v4f32|v4i32)")>;
545
546// ASIMD table lookup, D-form
547def : InstRW<[A57Write_3cyc_1V], (instregex "^TB[LX]v8i8One")>;
548def : InstRW<[A57Write_6cyc_2V], (instregex "^TB[LX]v8i8Two")>;
549def : InstRW<[A57Write_9cyc_3V], (instregex "^TB[LX]v8i8Three")>;
550def : InstRW<[A57Write_12cyc_4V], (instregex "^TB[LX]v8i8Four")>;
551// ASIMD table lookup, Q-form
552def : InstRW<[A57Write_6cyc_3V], (instregex "^TB[LX]v16i8One")>;
553def : InstRW<[A57Write_9cyc_5V], (instregex "^TB[LX]v16i8Two")>;
554def : InstRW<[A57Write_12cyc_7V], (instregex "^TB[LX]v16i8Three")>;
555def : InstRW<[A57Write_15cyc_9V], (instregex "^TB[LX]v16i8Four")>;
556
557// ASIMD transfer, element to gen reg
558def : InstRW<[A57Write_6cyc_1I_1L], (instregex "^[SU]MOVv")>;
559
560// ASIMD transfer, gen reg to element
561def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^INSv")>;
562
563// ASIMD unzip/zip, Q-form
564def : InstRW<[A57Write_6cyc_3V], (instregex "^(UZP|ZIP)(1|2)(v16i8|v8i16|v4i32|v2i64)")>;
565
566
567// Remainder
568// -----------------------------------------------------------------------------
569
570def : InstRW<[A57Write_5cyc_1V], (instregex "^F(ADD|SUB)[DS]rr")>;
571
572// Cortex A57 Software Optimization Guide Sec 3.10
573def A57WriteFPMA  : SchedWriteRes<[A57UnitV]> { let Latency = 9;  }
574def A57ReadFPMA5  : SchedReadAdvance<5, [A57WriteFPMA, WriteFMul]>;
575def A57ReadFPM    : SchedReadAdvance<0>;
576def : InstRW<[A57WriteFPMA, A57ReadFPM, A57ReadFPM, A57ReadFPMA5], (instregex "^FN?M(ADD|SUB)[DS]rrr")>;
577
578def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[FSU]CVT[AMNPZ][SU](_Int)?[SU]?[XW]?[DS]?[rds]i?")>;
579def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[SU]CVTF")>;
580
581def : InstRW<[A57Write_32cyc_1W], (instrs FDIVDrr)>;
582def : InstRW<[A57Write_17cyc_1W], (instrs FDIVSrr)>;
583
584def : InstRW<[A57Write_5cyc_1V], (instregex "^F(MAX|MIN).+rr")>;
585
586def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT.+r")>;
587
588def : InstRW<[A57Write_32cyc_1W], (instrs FSQRTDr)>;
589def : InstRW<[A57Write_17cyc_1W], (instrs FSQRTSr)>;
590
591def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPDi)>;
592def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDNPQi)>;
593def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPSi)>;
594def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPDi)>;
595def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPDpost)>;
596def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPDpre)>;
597def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDPQi)>;
598def : InstRW<[A57Write_6cyc_2L, WriteLDHi, WriteAdr], (instrs LDPQpost)>;
599def : InstRW<[A57Write_6cyc_2L, WriteLDHi, WriteAdr], (instrs LDPQpre)>;
600def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWi)>;
601def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi, WriteAdr], (instrs LDPSWpost)>;
602def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi, WriteAdr], (instrs LDPSWpre)>;
603def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPSi)>;
604def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPSpost)>;
605def : InstRW<[A57Write_5cyc_1L, WriteLDHi, WriteAdr], (instrs LDPSpre)>;
606def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRBpost)>;
607def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRBpre)>;
608def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroW)>;
609def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroX)>;
610def : InstRW<[A57Write_5cyc_1L], (instrs LDRBui)>;
611def : InstRW<[A57Write_5cyc_1L], (instrs LDRDl)>;
612def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRDpost)>;
613def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRDpre)>;
614def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroW)>;
615def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroX)>;
616def : InstRW<[A57Write_5cyc_1L], (instrs LDRDui)>;
617def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroW)>;
618def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroX)>;
619def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRHpost)>;
620def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRHpre)>;
621def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroW)>;
622def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroX)>;
623def : InstRW<[A57Write_5cyc_1L], (instrs LDRHui)>;
624def : InstRW<[A57Write_5cyc_1L], (instrs LDRQl)>;
625def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRQpost)>;
626def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRQpre)>;
627def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroW)>;
628def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroX)>;
629def : InstRW<[A57Write_5cyc_1L], (instrs LDRQui)>;
630def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroW)>;
631def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroX)>;
632def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroW)>;
633def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroX)>;
634def : InstRW<[A57Write_5cyc_1L], (instrs LDRSl)>;
635def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRSpost)>;
636def : InstRW<[A57Write_5cyc_1L, WriteAdr], (instrs LDRSpre)>;
637def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroW)>;
638def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroX)>;
639def : InstRW<[A57Write_5cyc_1L], (instrs LDRSui)>;
640def : InstRW<[A57Write_5cyc_1L], (instrs LDURBi)>;
641def : InstRW<[A57Write_5cyc_1L], (instrs LDURDi)>;
642def : InstRW<[A57Write_5cyc_1L], (instrs LDURHi)>;
643def : InstRW<[A57Write_5cyc_1L], (instrs LDURQi)>;
644def : InstRW<[A57Write_5cyc_1L], (instrs LDURSi)>;
645
646def : InstRW<[A57Write_2cyc_2S], (instrs STNPDi)>;
647def : InstRW<[A57Write_4cyc_1I_4S], (instrs STNPQi)>;
648def : InstRW<[A57Write_2cyc_2S], (instrs STNPXi)>;
649def : InstRW<[A57Write_2cyc_2S], (instrs STPDi)>;
650def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpost)>;
651def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpre)>;
652def : InstRW<[A57Write_4cyc_1I_4S], (instrs STPQi)>;
653def : InstRW<[WriteAdr, A57Write_4cyc_1I_4S], (instrs STPQpost)>;
654def : InstRW<[WriteAdr, A57Write_4cyc_2I_4S], (instrs STPQpre)>;
655def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpost)>;
656def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpre)>;
657def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpost)>;
658def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpre)>;
659def : InstRW<[A57Write_2cyc_2S], (instrs STPXi)>;
660def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpost)>;
661def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpre)>;
662def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpost)>;
663def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpre)>;
664def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBpost)>;
665def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRBpre)>;
666def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroW)>;
667def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroX)>;
668def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRDpost)>;
669def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRDpre)>;
670def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpost)>;
671def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpre)>;
672def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroW)>;
673def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroX)>;
674def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHpost)>;
675def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRHpre)>;
676def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroW)>;
677def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroX)>;
678def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQpost)>;
679def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STRQpre)>;
680def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroW)>;
681def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroX)>;
682def : InstRW<[A57Write_2cyc_1I_2S], (instrs STRQui)>;
683def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRSpost)>;
684def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRSpre)>;
685def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpost)>;
686def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpre)>;
687def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpost)>;
688def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpre)>;
689def : InstRW<[A57Write_2cyc_2S], (instrs STURQi)>;
690
691} // SchedModel = CortexA57Model
692