1//=- AArch64SchedA57.td - ARM Cortex-A57 Scheduling Defs -----*- tablegen -*-=// 2// 3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4// See https://llvm.org/LICENSE.txt for license information. 5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6// 7//===----------------------------------------------------------------------===// 8// 9// This file defines the machine model for ARM Cortex-A57 to support 10// instruction scheduling and other instruction cost heuristics. 11// 12//===----------------------------------------------------------------------===// 13 14//===----------------------------------------------------------------------===// 15// The Cortex-A57 is a traditional superscalar microprocessor with a 16// conservative 3-wide in-order stage for decode and dispatch. Combined with the 17// much wider out-of-order issue stage, this produced a need to carefully 18// schedule micro-ops so that all three decoded each cycle are successfully 19// issued as the reservation station(s) simply don't stay occupied for long. 20// Therefore, IssueWidth is set to the narrower of the two at three, while still 21// modeling the machine as out-of-order. 22 23def CortexA57Model : SchedMachineModel { 24 let IssueWidth = 3; // 3-way decode and dispatch 25 let MicroOpBufferSize = 128; // 128 micro-op re-order buffer 26 let LoadLatency = 4; // Optimistic load latency 27 let MispredictPenalty = 14; // Fetch + Decode/Rename/Dispatch + Branch 28 29 // Enable partial & runtime unrolling. The magic number is chosen based on 30 // experiments and benchmarking data. 31 let LoopMicroOpBufferSize = 16; 32 let CompleteModel = 1; 33 34 list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F, 35 PAUnsupported.F, 36 SMEUnsupported.F, 37 [HasMTE, HasCSSC]); 38} 39 40//===----------------------------------------------------------------------===// 41// Define each kind of processor resource and number available on Cortex-A57. 42// Cortex A-57 has 8 pipelines that each has its own 8-entry queue where 43// micro-ops wait for their operands and then issue out-of-order. 44 45def A57UnitB : ProcResource<1>; // Type B micro-ops 46def A57UnitI : ProcResource<2>; // Type I micro-ops 47def A57UnitM : ProcResource<1>; // Type M micro-ops 48def A57UnitL : ProcResource<1>; // Type L micro-ops 49def A57UnitS : ProcResource<1>; // Type S micro-ops 50def A57UnitX : ProcResource<1>; // Type X micro-ops 51def A57UnitW : ProcResource<1>; // Type W micro-ops 52let SchedModel = CortexA57Model in { 53 def A57UnitV : ProcResGroup<[A57UnitX, A57UnitW]>; // Type V micro-ops 54} 55 56let SchedModel = CortexA57Model in { 57 58//===----------------------------------------------------------------------===// 59// Define customized scheduler read/write types specific to the Cortex-A57. 60 61include "AArch64SchedA57WriteRes.td" 62 63//===----------------------------------------------------------------------===// 64// Map the target-defined scheduler read/write resources and latency for 65// Cortex-A57. The Cortex-A57 types are directly associated with resources, so 66// defining the aliases precludes the need for mapping them using WriteRes. The 67// aliases are sufficient for creating a coarse, working model. As the model 68// evolves, InstRWs will be used to override some of these SchedAliases. 69// 70// WARNING: Using SchedAliases is convenient and works well for latency and 71// resource lookup for instructions. However, this creates an entry in 72// AArch64WriteLatencyTable with a WriteResourceID of 0, breaking 73// any SchedReadAdvance since the lookup will fail. 74 75def : SchedAlias<WriteImm, A57Write_1cyc_1I>; 76def : SchedAlias<WriteI, A57Write_1cyc_1I>; 77def : SchedAlias<WriteISReg, A57Write_2cyc_1M>; 78def : SchedAlias<WriteIEReg, A57Write_2cyc_1M>; 79def : SchedAlias<WriteExtr, A57Write_1cyc_1I>; 80def : SchedAlias<WriteIS, A57Write_1cyc_1I>; 81def : SchedAlias<WriteID32, A57Write_19cyc_1M>; 82def : SchedAlias<WriteID64, A57Write_35cyc_1M>; 83def : WriteRes<WriteIM32, [A57UnitM]> { let Latency = 3; } 84def : WriteRes<WriteIM64, [A57UnitM]> { let Latency = 5; } 85def : SchedAlias<WriteBr, A57Write_1cyc_1B>; 86def : SchedAlias<WriteBrReg, A57Write_1cyc_1B>; 87def : SchedAlias<WriteLD, A57Write_4cyc_1L>; 88def : SchedAlias<WriteST, A57Write_1cyc_1S>; 89def : SchedAlias<WriteSTP, A57Write_1cyc_1S>; 90def : SchedAlias<WriteAdr, A57Write_1cyc_1I>; 91def : SchedAlias<WriteLDIdx, A57Write_4cyc_1I_1L>; 92def : SchedAlias<WriteSTIdx, A57Write_1cyc_1I_1S>; 93def : SchedAlias<WriteF, A57Write_3cyc_1V>; 94def : SchedAlias<WriteFCmp, A57Write_3cyc_1V>; 95def : SchedAlias<WriteFCvt, A57Write_5cyc_1V>; 96def : SchedAlias<WriteFCopy, A57Write_5cyc_1L>; 97def : SchedAlias<WriteFImm, A57Write_3cyc_1V>; 98def : WriteRes<WriteFMul, [A57UnitV]> { let Latency = 5;} 99def : SchedAlias<WriteFDiv, A57Write_17cyc_1W>; 100def : SchedAlias<WriteVd, A57Write_3cyc_1V>; 101def : SchedAlias<WriteVq, A57Write_3cyc_1V>; 102def : SchedAlias<WriteVLD, A57Write_5cyc_1L>; 103def : SchedAlias<WriteVST, A57Write_1cyc_1S>; 104 105def : WriteRes<WriteAtomic, []> { let Unsupported = 1; } 106 107def : WriteRes<WriteSys, []> { let Latency = 1; } 108def : WriteRes<WriteBarrier, []> { let Latency = 1; } 109def : WriteRes<WriteHint, []> { let Latency = 1; } 110 111def : WriteRes<WriteLDHi, []> { let Latency = 4; } 112 113// Forwarding logic is only modeled for multiply and accumulate 114def : ReadAdvance<ReadI, 0>; 115def : ReadAdvance<ReadISReg, 0>; 116def : ReadAdvance<ReadIEReg, 0>; 117def : ReadAdvance<ReadIM, 0>; 118def : ReadAdvance<ReadIMA, 2, [WriteIM32, WriteIM64]>; 119def : ReadAdvance<ReadID, 0>; 120def : ReadAdvance<ReadExtrHi, 0>; 121def : ReadAdvance<ReadST, 0>; 122def : ReadAdvance<ReadAdrBase, 0>; 123def : ReadAdvance<ReadVLD, 0>; 124 125 126//===----------------------------------------------------------------------===// 127// Specialize the coarse model by associating instruction groups with the 128// subtarget-defined types. As the modeled is refined, this will override most 129// of the above ShchedAlias mappings. 130 131// Miscellaneous 132// ----------------------------------------------------------------------------- 133 134def : InstRW<[WriteI], (instrs COPY)>; 135 136 137// Branch Instructions 138// ----------------------------------------------------------------------------- 139 140def : InstRW<[A57Write_1cyc_1B_1I], (instrs BL)>; 141def : InstRW<[A57Write_2cyc_1B_1I], (instrs BLR)>; 142 143 144// Shifted Register with Shift == 0 145// ---------------------------------------------------------------------------- 146 147def A57WriteISReg : SchedWriteVariant<[ 148 SchedVar<RegShiftedPred, [WriteISReg]>, 149 SchedVar<NoSchedPred, [WriteI]>]>; 150def : InstRW<[A57WriteISReg], (instregex ".*rs$")>; 151 152 153// Divide and Multiply Instructions 154// ----------------------------------------------------------------------------- 155 156// Multiply high 157def : InstRW<[A57Write_6cyc_1M], (instrs SMULHrr, UMULHrr)>; 158 159 160// Miscellaneous Data-Processing Instructions 161// ----------------------------------------------------------------------------- 162 163def : InstRW<[A57Write_1cyc_1I], (instrs EXTRWrri)>; 164def : InstRW<[A57Write_3cyc_1I_1M], (instrs EXTRXrri)>; 165def : InstRW<[A57Write_2cyc_1M], (instregex "BFM")>; 166 167 168// Cryptography Extensions 169// ----------------------------------------------------------------------------- 170 171def A57ReadAES : SchedReadAdvance<3, [A57Write_3cyc_1W]>; 172def : InstRW<[A57Write_3cyc_1W], (instregex "^AES[DE]")>; 173def : InstRW<[A57Write_3cyc_1W, A57ReadAES], (instregex "^AESI?MC")>; 174def : InstRW<[A57Write_6cyc_2V], (instregex "^SHA1SU0")>; 175def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA1(H|SU1)")>; 176def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA1[CMP]")>; 177def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA256SU0")>; 178def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA256(H|H2|SU1)")>; 179def : InstRW<[A57Write_3cyc_1W], (instregex "^CRC32")>; 180 181 182// Vector Load 183// ----------------------------------------------------------------------------- 184 185def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1i(8|16|32)$")>; 186def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1i(8|16|32)_POST$")>; 187def : InstRW<[A57Write_5cyc_1L], (instregex "LD1i(64)$")>; 188def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1i(64)_POST$")>; 189 190def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(8b|4h|2s)$")>; 191def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1Rv(8b|4h|2s)_POST$")>; 192def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Rv(1d)$")>; 193def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Rv(1d)_POST$")>; 194def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(16b|8h|4s|2d)$")>; 195def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1Rv(16b|8h|4s|2d)_POST$")>; 196 197def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(8b|4h|2s|1d)$")>; 198def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Onev(8b|4h|2s|1d)_POST$")>; 199def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(16b|8h|4s|2d)$")>; 200def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Onev(16b|8h|4s|2d)_POST$")>; 201def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Twov(8b|4h|2s|1d)$")>; 202def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Twov(8b|4h|2s|1d)_POST$")>; 203def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Twov(16b|8h|4s|2d)$")>; 204def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Twov(16b|8h|4s|2d)_POST$")>; 205def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Threev(8b|4h|2s|1d)$")>; 206def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Threev(8b|4h|2s|1d)_POST$")>; 207def : InstRW<[A57Write_7cyc_3L], (instregex "LD1Threev(16b|8h|4s|2d)$")>; 208def : InstRW<[WriteAdr, A57Write_7cyc_3L], (instregex "LD1Threev(16b|8h|4s|2d)_POST$")>; 209def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Fourv(8b|4h|2s|1d)$")>; 210def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Fourv(8b|4h|2s|1d)_POST$")>; 211def : InstRW<[A57Write_8cyc_4L], (instregex "LD1Fourv(16b|8h|4s|2d)$")>; 212def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD1Fourv(16b|8h|4s|2d)_POST$")>; 213 214def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2i(8|16)$")>; 215def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD2i(8|16)_POST$")>; 216def : InstRW<[A57Write_6cyc_2L], (instregex "LD2i(32)$")>; 217def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD2i(32)_POST$")>; 218def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2i(64)$")>; 219def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2i(64)_POST$")>; 220 221def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Rv(8b|4h|2s)$")>; 222def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2Rv(8b|4h|2s)_POST$")>; 223def : InstRW<[A57Write_5cyc_1L], (instregex "LD2Rv(1d)$")>; 224def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD2Rv(1d)_POST$")>; 225def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2Rv(16b|8h|4s|2d)$")>; 226def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD2Rv(16b|8h|4s|2d)_POST$")>; 227 228def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Twov(8b|4h|2s)$")>; 229def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2Twov(8b|4h|2s)_POST$")>; 230def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD2Twov(16b|8h|4s)$")>; 231def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD2Twov(16b|8h|4s)_POST$")>; 232def : InstRW<[A57Write_6cyc_2L], (instregex "LD2Twov(2d)$")>; 233def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD2Twov(2d)_POST$")>; 234 235def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3i(8|16)$")>; 236def : InstRW<[WriteAdr, A57Write_9cyc_1L_3V], (instregex "LD3i(8|16)_POST$")>; 237def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3i(32)$")>; 238def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD3i(32)_POST$")>; 239def : InstRW<[A57Write_6cyc_2L], (instregex "LD3i(64)$")>; 240def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD3i(64)_POST$")>; 241 242def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3Rv(8b|4h|2s)$")>; 243def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD3Rv(8b|4h|2s)_POST$")>; 244def : InstRW<[A57Write_6cyc_2L], (instregex "LD3Rv(1d)$")>; 245def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD3Rv(1d)_POST$")>; 246def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3Rv(16b|8h|4s)$")>; 247def : InstRW<[WriteAdr, A57Write_9cyc_1L_3V], (instregex "LD3Rv(16b|8h|4s)_POST$")>; 248def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD3Rv(2d)$")>; 249def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD3Rv(2d)_POST$")>; 250 251def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD3Threev(8b|4h|2s)$")>; 252def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD3Threev(8b|4h|2s)_POST$")>; 253def : InstRW<[A57Write_10cyc_3L_4V], (instregex "LD3Threev(16b|8h|4s)$")>; 254def : InstRW<[WriteAdr, A57Write_10cyc_3L_4V], (instregex "LD3Threev(16b|8h|4s)_POST$")>; 255def : InstRW<[A57Write_8cyc_4L], (instregex "LD3Threev(2d)$")>; 256def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD3Threev(2d)_POST$")>; 257 258def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(8|16)$")>; 259def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4i(8|16)_POST$")>; 260def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4i(32)$")>; 261def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD4i(32)_POST$")>; 262def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(64)$")>; 263def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4i(64)_POST$")>; 264 265def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4Rv(8b|4h|2s)$")>; 266def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD4Rv(8b|4h|2s)_POST$")>; 267def : InstRW<[A57Write_6cyc_2L], (instregex "LD4Rv(1d)$")>; 268def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD4Rv(1d)_POST$")>; 269def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4Rv(16b|8h|4s)$")>; 270def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4Rv(16b|8h|4s)_POST$")>; 271def : InstRW<[A57Write_9cyc_2L_4V], (instregex "LD4Rv(2d)$")>; 272def : InstRW<[WriteAdr, A57Write_9cyc_2L_4V], (instregex "LD4Rv(2d)_POST$")>; 273 274def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD4Fourv(8b|4h|2s)$")>; 275def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD4Fourv(8b|4h|2s)_POST$")>; 276def : InstRW<[A57Write_11cyc_4L_4V], (instregex "LD4Fourv(16b|8h|4s)$")>; 277def : InstRW<[WriteAdr, A57Write_11cyc_4L_4V], (instregex "LD4Fourv(16b|8h|4s)_POST$")>; 278def : InstRW<[A57Write_8cyc_4L], (instregex "LD4Fourv(2d)$")>; 279def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD4Fourv(2d)_POST$")>; 280 281// Vector Store 282// ----------------------------------------------------------------------------- 283 284def : InstRW<[A57Write_1cyc_1S], (instregex "ST1i(8|16|32)$")>; 285def : InstRW<[WriteAdr, A57Write_1cyc_1S], (instregex "ST1i(8|16|32)_POST$")>; 286def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST1i(64)$")>; 287def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST1i(64)_POST$")>; 288 289def : InstRW<[A57Write_1cyc_1S], (instregex "ST1Onev(8b|4h|2s|1d)$")>; 290def : InstRW<[WriteAdr, A57Write_1cyc_1S], (instregex "ST1Onev(8b|4h|2s|1d)_POST$")>; 291def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Onev(16b|8h|4s|2d)$")>; 292def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST1Onev(16b|8h|4s|2d)_POST$")>; 293def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Twov(8b|4h|2s|1d)$")>; 294def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST1Twov(8b|4h|2s|1d)_POST$")>; 295def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Twov(16b|8h|4s|2d)$")>; 296def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST1Twov(16b|8h|4s|2d)_POST$")>; 297def : InstRW<[A57Write_3cyc_3S], (instregex "ST1Threev(8b|4h|2s|1d)$")>; 298def : InstRW<[WriteAdr, A57Write_3cyc_3S], (instregex "ST1Threev(8b|4h|2s|1d)_POST$")>; 299def : InstRW<[A57Write_6cyc_6S], (instregex "ST1Threev(16b|8h|4s|2d)$")>; 300def : InstRW<[WriteAdr, A57Write_6cyc_6S], (instregex "ST1Threev(16b|8h|4s|2d)_POST$")>; 301def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Fourv(8b|4h|2s|1d)$")>; 302def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST1Fourv(8b|4h|2s|1d)_POST$")>; 303def : InstRW<[A57Write_8cyc_8S], (instregex "ST1Fourv(16b|8h|4s|2d)$")>; 304def : InstRW<[WriteAdr, A57Write_8cyc_8S], (instregex "ST1Fourv(16b|8h|4s|2d)_POST$")>; 305 306def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST2i(8|16|32)$")>; 307def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST2i(8|16|32)_POST$")>; 308def : InstRW<[A57Write_2cyc_2S], (instregex "ST2i(64)$")>; 309def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST2i(64)_POST$")>; 310 311def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST2Twov(8b|4h|2s)$")>; 312def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST2Twov(8b|4h|2s)_POST$")>; 313def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST2Twov(16b|8h|4s)$")>; 314def : InstRW<[WriteAdr, A57Write_4cyc_4S_2V], (instregex "ST2Twov(16b|8h|4s)_POST$")>; 315def : InstRW<[A57Write_4cyc_4S], (instregex "ST2Twov(2d)$")>; 316def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST2Twov(2d)_POST$")>; 317 318def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST3i(8|16)$")>; 319def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST3i(8|16)_POST$")>; 320def : InstRW<[A57Write_3cyc_3S], (instregex "ST3i(32)$")>; 321def : InstRW<[WriteAdr, A57Write_3cyc_3S], (instregex "ST3i(32)_POST$")>; 322def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST3i(64)$")>; 323def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST3i(64)_POST$")>; 324 325def : InstRW<[A57Write_3cyc_3S_2V], (instregex "ST3Threev(8b|4h|2s)$")>; 326def : InstRW<[WriteAdr, A57Write_3cyc_3S_2V], (instregex "ST3Threev(8b|4h|2s)_POST$")>; 327def : InstRW<[A57Write_6cyc_6S_4V], (instregex "ST3Threev(16b|8h|4s)$")>; 328def : InstRW<[WriteAdr, A57Write_6cyc_6S_4V], (instregex "ST3Threev(16b|8h|4s)_POST$")>; 329def : InstRW<[A57Write_6cyc_6S], (instregex "ST3Threev(2d)$")>; 330def : InstRW<[WriteAdr, A57Write_6cyc_6S], (instregex "ST3Threev(2d)_POST$")>; 331 332def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST4i(8|16)$")>; 333def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST4i(8|16)_POST$")>; 334def : InstRW<[A57Write_4cyc_4S], (instregex "ST4i(32)$")>; 335def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST4i(32)_POST$")>; 336def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST4i(64)$")>; 337def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST4i(64)_POST$")>; 338 339def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST4Fourv(8b|4h|2s)$")>; 340def : InstRW<[WriteAdr, A57Write_4cyc_4S_2V], (instregex "ST4Fourv(8b|4h|2s)_POST$")>; 341def : InstRW<[A57Write_8cyc_8S_4V], (instregex "ST4Fourv(16b|8h|4s)$")>; 342def : InstRW<[WriteAdr, A57Write_8cyc_8S_4V], (instregex "ST4Fourv(16b|8h|4s)_POST$")>; 343def : InstRW<[A57Write_8cyc_8S], (instregex "ST4Fourv(2d)$")>; 344def : InstRW<[WriteAdr, A57Write_8cyc_8S], (instregex "ST4Fourv(2d)_POST$")>; 345 346// Vector - Integer 347// ----------------------------------------------------------------------------- 348 349// Reference for forms in this group 350// D form - v8i8, v4i16, v2i32 351// Q form - v16i8, v8i16, v4i32 352// D form - v1i8, v1i16, v1i32, v1i64 353// Q form - v16i8, v8i16, v4i32, v2i64 354// D form - v8i8_v8i16, v4i16_v4i32, v2i32_v2i64 355// Q form - v16i8_v8i16, v8i16_v4i32, v4i32_v2i64 356 357// Cortex A57 Software Optimization Guide Sec 3.14 358// Advance for absolute diff accum, pairwise add and accumulate, shift accumulate 359def A57ReadIVA3 : SchedReadAdvance<3, [A57Write_4cyc_1X_NonMul_Forward, A57Write_5cyc_2X_NonMul_Forward]>; 360 361// ASIMD absolute diff accum, D-form 362def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>; 363// ASIMD absolute diff accum, Q-form 364def : InstRW<[A57Write_5cyc_2X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>; 365// ASIMD absolute diff accum long 366def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABAL")>; 367 368// ASIMD arith, reduce, 4H/4S 369def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>; 370// ASIMD arith, reduce, 8B/8H 371def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>; 372// ASIMD arith, reduce, 16B 373def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU]?ADDL?Vv16i8v$")>; 374 375// ASIMD max/min, reduce, 4H/4S 376def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>; 377// ASIMD max/min, reduce, 8B/8H 378def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>; 379// ASIMD max/min, reduce, 16B 380def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU](MIN|MAX)Vv16i8v$")>; 381 382// ASIMD multiply, D-form 383// MUL 384def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^MUL(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>; 385// PMUL, SQDMULH, SQRDMULH 386def : InstRW<[A57Write_5cyc_1W], (instregex "^(PMUL|SQR?DMULH)(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>; 387 388// ASIMD multiply, Q-form 389// MUL 390def : InstRW<[A57Write_6cyc_2W_Mul_Forward], (instregex "^MUL(v16i8|v8i16|v4i32)(_indexed)?$")>; 391// PMUL, SQDMULH, SQRDMULH 392def : InstRW<[A57Write_6cyc_2W], (instregex "^(PMUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>; 393 394// Cortex A57 Software Optimization Guide Sec 3.14 395def A57ReadIVMA4 : SchedReadAdvance<4 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>; 396def A57ReadIVMA3 : SchedReadAdvance<3 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>; 397 398// ASIMD multiply accumulate, D-form 399def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>; 400// ASIMD multiply accumulate, Q-form 401def : InstRW<[A57Write_6cyc_2W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>; 402 403// ASIMD multiply accumulate long 404// ASIMD multiply accumulate saturating long 405def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^(S|U)ML[AS]L")>; 406def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA3], (instregex "^SQDML[AS]L")>; 407 408// ASIMD multiply long 409def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^(S|U)MULL")>; 410def : InstRW<[A57Write_5cyc_1W], (instregex "^SQDMULL")>; 411def : InstRW<[A57Write_5cyc_1W], (instregex "^PMULL(v8i8|v16i8)")>; 412def : InstRW<[A57Write_3cyc_1W], (instregex "^PMULL(v1i64|v2i64)")>; 413 414// ASIMD pairwise add and accumulate 415// ASIMD shift accumulate 416def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ADALP")>; 417def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^(S|SR|U|UR)SRA")>; 418 419// ASIMD shift by immed, complex 420def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?(Q|R){1,2}SHR")>; 421def : InstRW<[A57Write_4cyc_1X], (instregex "^SQSHLU")>; 422 423 424// ASIMD shift by register, basic, Q-form 425def : InstRW<[A57Write_4cyc_2X], (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>; 426 427// ASIMD shift by register, complex, D-form 428def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU][QR]{1,2}SHL(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>; 429 430// ASIMD shift by register, complex, Q-form 431def : InstRW<[A57Write_5cyc_2X], (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>; 432 433 434// Vector - Floating Point 435// ----------------------------------------------------------------------------- 436 437// Reference for forms in this group 438// D form - v2f32 439// Q form - v4f32, v2f64 440// D form - 32, 64 441// D form - v1i32, v1i64 442// D form - v2i32 443// Q form - v4i32, v2i64 444 445// ASIMD FP arith, normal, D-form 446def : InstRW<[A57Write_5cyc_1V], (instregex "^(FABD|FADD|FSUB)(v2f32|32|64|v2i32p)")>; 447// ASIMD FP arith, normal, Q-form 448def : InstRW<[A57Write_5cyc_2V], (instregex "^(FABD|FADD|FSUB)(v4f32|v2f64|v2i64p)")>; 449 450// ASIMD FP arith, pairwise, D-form 451def : InstRW<[A57Write_5cyc_1V], (instregex "^FADDP(v2f32|32|64|v2i32)")>; 452// ASIMD FP arith, pairwise, Q-form 453def : InstRW<[A57Write_9cyc_3V], (instregex "^FADDP(v4f32|v2f64|v2i64)")>; 454 455// ASIMD FP compare, D-form 456def : InstRW<[A57Write_5cyc_1V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v2f32|32|64|v1i32|v2i32|v1i64)")>; 457// ASIMD FP compare, Q-form 458def : InstRW<[A57Write_5cyc_2V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v4f32|v2f64|v4i32|v2i64)")>; 459 460// ASIMD FP convert, long and narrow 461def : InstRW<[A57Write_8cyc_3V], (instregex "^FCVT(L|N|XN)v")>; 462// ASIMD FP convert, other, D-form 463def : InstRW<[A57Write_5cyc_1V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>; 464// ASIMD FP convert, other, Q-form 465def : InstRW<[A57Write_5cyc_2V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>; 466 467// ASIMD FP divide, D-form, F32 468def : InstRW<[A57Write_17cyc_1W], (instregex "FDIVv2f32")>; 469// ASIMD FP divide, Q-form, F32 470def : InstRW<[A57Write_34cyc_2W], (instregex "FDIVv4f32")>; 471// ASIMD FP divide, Q-form, F64 472def : InstRW<[A57Write_64cyc_2W], (instregex "FDIVv2f64")>; 473 474// Note: These were simply duplicated from ASIMD FDIV because of missing documentation 475// ASIMD FP square root, D-form, F32 476def : InstRW<[A57Write_17cyc_1W], (instregex "FSQRTv2f32")>; 477// ASIMD FP square root, Q-form, F32 478def : InstRW<[A57Write_34cyc_2W], (instregex "FSQRTv4f32")>; 479// ASIMD FP square root, Q-form, F64 480def : InstRW<[A57Write_64cyc_2W], (instregex "FSQRTv2f64")>; 481 482// ASIMD FP max/min, normal, D-form 483def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?(v2f32)")>; 484// ASIMD FP max/min, normal, Q-form 485def : InstRW<[A57Write_5cyc_2V], (instregex "^(FMAX|FMIN)(NM)?(v4f32|v2f64)")>; 486// ASIMD FP max/min, pairwise, D-form 487def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?P(v2f32|v2i32)")>; 488// ASIMD FP max/min, pairwise, Q-form 489def : InstRW<[A57Write_9cyc_3V], (instregex "^(FMAX|FMIN)(NM)?P(v4f32|v2f64|v2i64)")>; 490// ASIMD FP max/min, reduce 491def : InstRW<[A57Write_10cyc_3V], (instregex "^(FMAX|FMIN)(NM)?Vv")>; 492 493// ASIMD FP multiply, D-form, FZ 494def : InstRW<[A57Write_5cyc_1V_FP_Forward], (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>; 495// ASIMD FP multiply, Q-form, FZ 496def : InstRW<[A57Write_5cyc_2V_FP_Forward], (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>; 497 498// ASIMD FP multiply accumulate, D-form, FZ 499// ASIMD FP multiply accumulate, Q-form, FZ 500def A57WriteFPVMAD : SchedWriteRes<[A57UnitV]> { let Latency = 9; } 501def A57WriteFPVMAQ : SchedWriteRes<[A57UnitV, A57UnitV]> { let Latency = 10; } 502 503// Cortex A57 Software Optimization Guide Sec 3.15 504// Advances from FP mul and mul-accum to mul-accum 505def A57ReadFPVMA5 : SchedReadAdvance<5, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>; 506def A57ReadFPVMA6 : SchedReadAdvance<6, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>; 507 508def : InstRW<[A57WriteFPVMAD, A57ReadFPVMA5], (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>; 509def : InstRW<[A57WriteFPVMAQ, A57ReadFPVMA6], (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>; 510 511// ASIMD FP round, D-form 512def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT[AIMNPXZ](v2f32)")>; 513// ASIMD FP round, Q-form 514def : InstRW<[A57Write_5cyc_2V], (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>; 515 516 517// Vector - Miscellaneous 518// ----------------------------------------------------------------------------- 519 520// Reference for forms in this group 521// D form - v8i8, v4i16, v2i32 522// Q form - v16i8, v8i16, v4i32 523// D form - v1i8, v1i16, v1i32, v1i64 524// Q form - v16i8, v8i16, v4i32, v2i64 525 526// ASIMD bitwise insert, Q-form 527def : InstRW<[A57Write_3cyc_2V], (instregex "^(BIF|BIT|BSL|BSP)v16i8")>; 528 529// ASIMD duplicate, gen reg, D-form and Q-form 530def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUP(i8|i16|i32|i64)$")>; 531def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUPv.+gpr")>; 532 533// ASIMD move, saturating 534def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]QXTU?N")>; 535 536// ASIMD reciprocal estimate, D-form 537def : InstRW<[A57Write_5cyc_1V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f32|v1i32|v2i32|v1i64)")>; 538// ASIMD reciprocal estimate, Q-form 539def : InstRW<[A57Write_5cyc_2V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f64|v4f32|v4i32)")>; 540 541// ASIMD reciprocal step, D-form, FZ 542def : InstRW<[A57Write_9cyc_1V], (instregex "^F(RECP|RSQRT)S(v2f32|v1i32|v2i32|v1i64|32|64)")>; 543// ASIMD reciprocal step, Q-form, FZ 544def : InstRW<[A57Write_9cyc_2V], (instregex "^F(RECP|RSQRT)S(v2f64|v4f32|v4i32)")>; 545 546// ASIMD table lookup, D-form 547def : InstRW<[A57Write_3cyc_1V], (instregex "^TB[LX]v8i8One")>; 548def : InstRW<[A57Write_6cyc_2V], (instregex "^TB[LX]v8i8Two")>; 549def : InstRW<[A57Write_9cyc_3V], (instregex "^TB[LX]v8i8Three")>; 550def : InstRW<[A57Write_12cyc_4V], (instregex "^TB[LX]v8i8Four")>; 551// ASIMD table lookup, Q-form 552def : InstRW<[A57Write_6cyc_3V], (instregex "^TB[LX]v16i8One")>; 553def : InstRW<[A57Write_9cyc_5V], (instregex "^TB[LX]v16i8Two")>; 554def : InstRW<[A57Write_12cyc_7V], (instregex "^TB[LX]v16i8Three")>; 555def : InstRW<[A57Write_15cyc_9V], (instregex "^TB[LX]v16i8Four")>; 556 557// ASIMD transfer, element to gen reg 558def : InstRW<[A57Write_6cyc_1I_1L], (instregex "^[SU]MOVv")>; 559 560// ASIMD transfer, gen reg to element 561def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^INSv")>; 562 563// ASIMD unzip/zip, Q-form 564def : InstRW<[A57Write_6cyc_3V], (instregex "^(UZP|ZIP)(1|2)(v16i8|v8i16|v4i32|v2i64)")>; 565 566 567// Remainder 568// ----------------------------------------------------------------------------- 569 570def : InstRW<[A57Write_5cyc_1V], (instregex "^F(ADD|SUB)[DS]rr")>; 571 572// Cortex A57 Software Optimization Guide Sec 3.10 573def A57WriteFPMA : SchedWriteRes<[A57UnitV]> { let Latency = 9; } 574def A57ReadFPMA5 : SchedReadAdvance<5, [A57WriteFPMA, WriteFMul]>; 575def A57ReadFPM : SchedReadAdvance<0>; 576def : InstRW<[A57WriteFPMA, A57ReadFPM, A57ReadFPM, A57ReadFPMA5], (instregex "^FN?M(ADD|SUB)[DS]rrr")>; 577 578def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[FSU]CVT[AMNPZ][SU](_Int)?[SU]?[XW]?[DS]?[rds]i?")>; 579def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[SU]CVTF")>; 580 581def : InstRW<[A57Write_32cyc_1W], (instrs FDIVDrr)>; 582def : InstRW<[A57Write_17cyc_1W], (instrs FDIVSrr)>; 583 584def : InstRW<[A57Write_5cyc_1V], (instregex "^F(MAX|MIN).+rr")>; 585 586def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT.+r")>; 587 588def : InstRW<[A57Write_32cyc_1W], (instrs FSQRTDr)>; 589def : InstRW<[A57Write_17cyc_1W], (instrs FSQRTSr)>; 590 591def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPDi)>; 592def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDNPQi)>; 593def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPSi)>; 594def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPDi)>; 595def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPDpost)>; 596def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPDpre)>; 597def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDPQi)>; 598def : InstRW<[WriteAdr, A57Write_6cyc_2L, WriteLDHi], (instrs LDPQpost)>; 599def : InstRW<[WriteAdr, A57Write_6cyc_2L, WriteLDHi], (instrs LDPQpre)>; 600def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWi)>; 601def : InstRW<[WriteAdr, A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWpost)>; 602def : InstRW<[WriteAdr, A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWpre)>; 603def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPSi)>; 604def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPSpost)>; 605def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPSpre)>; 606def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRBpost)>; 607def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRBpre)>; 608def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroW)>; 609def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroX)>; 610def : InstRW<[A57Write_5cyc_1L], (instrs LDRBui)>; 611def : InstRW<[A57Write_5cyc_1L], (instrs LDRDl)>; 612def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRDpost)>; 613def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRDpre)>; 614def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroW)>; 615def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroX)>; 616def : InstRW<[A57Write_5cyc_1L], (instrs LDRDui)>; 617def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroW)>; 618def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroX)>; 619def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRHpost)>; 620def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRHpre)>; 621def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroW)>; 622def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroX)>; 623def : InstRW<[A57Write_5cyc_1L], (instrs LDRHui)>; 624def : InstRW<[A57Write_5cyc_1L], (instrs LDRQl)>; 625def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRQpost)>; 626def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRQpre)>; 627def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroW)>; 628def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroX)>; 629def : InstRW<[A57Write_5cyc_1L], (instrs LDRQui)>; 630def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroW)>; 631def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroX)>; 632def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroW)>; 633def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroX)>; 634def : InstRW<[A57Write_5cyc_1L], (instrs LDRSl)>; 635def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRSpost)>; 636def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRSpre)>; 637def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroW)>; 638def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroX)>; 639def : InstRW<[A57Write_5cyc_1L], (instrs LDRSui)>; 640def : InstRW<[A57Write_5cyc_1L], (instrs LDURBi)>; 641def : InstRW<[A57Write_5cyc_1L], (instrs LDURDi)>; 642def : InstRW<[A57Write_5cyc_1L], (instrs LDURHi)>; 643def : InstRW<[A57Write_5cyc_1L], (instrs LDURQi)>; 644def : InstRW<[A57Write_5cyc_1L], (instrs LDURSi)>; 645 646def : InstRW<[A57Write_2cyc_2S], (instrs STNPDi)>; 647def : InstRW<[A57Write_4cyc_1I_4S], (instrs STNPQi)>; 648def : InstRW<[A57Write_2cyc_2S], (instrs STNPXi)>; 649def : InstRW<[A57Write_2cyc_2S], (instrs STPDi)>; 650def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpost)>; 651def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpre)>; 652def : InstRW<[A57Write_4cyc_1I_4S], (instrs STPQi)>; 653def : InstRW<[WriteAdr, A57Write_4cyc_1I_4S], (instrs STPQpost)>; 654def : InstRW<[WriteAdr, A57Write_4cyc_2I_4S], (instrs STPQpre)>; 655def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpost)>; 656def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpre)>; 657def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpost)>; 658def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpre)>; 659def : InstRW<[A57Write_2cyc_2S], (instrs STPXi)>; 660def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpost)>; 661def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpre)>; 662def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpost)>; 663def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpre)>; 664def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBpost)>; 665def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRBpre)>; 666def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroW)>; 667def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroX)>; 668def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRDpost)>; 669def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRDpre)>; 670def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpost)>; 671def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpre)>; 672def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroW)>; 673def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroX)>; 674def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHpost)>; 675def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRHpre)>; 676def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroW)>; 677def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroX)>; 678def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQpost)>; 679def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STRQpre)>; 680def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroW)>; 681def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroX)>; 682def : InstRW<[A57Write_2cyc_1I_2S], (instrs STRQui)>; 683def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRSpost)>; 684def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRSpre)>; 685def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpost)>; 686def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpre)>; 687def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpost)>; 688def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpre)>; 689def : InstRW<[A57Write_2cyc_2S], (instrs STURQi)>; 690 691} // SchedModel = CortexA57Model 692