1//=- AArch64SchedThunderX3T110.td - Marvell ThunderX3 T110 ---*- tablegen -*-=// 2// 3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4// See https://llvm.org/LICENSE.txt for license information. 5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6// 7//===----------------------------------------------------------------------===// 8// 9// This file defines the scheduling model for Marvell ThunderX3T110 10// family of processors. 11// 12//===----------------------------------------------------------------------===// 13 14//===----------------------------------------------------------------------===// 15// Pipeline Description. 16 17def ThunderX3T110Model : SchedMachineModel { 18 let IssueWidth = 4; // 4 micro-ops dispatched at a time. 19 let MicroOpBufferSize = 70; // 70 entries in micro-op re-order buffer. 20 let LoadLatency = 4; // Optimistic load latency. 21 let MispredictPenalty = 12; // Extra cycles for mispredicted branch. 22 // Determined via a mix of micro-arch details and experimentation. 23 let LoopMicroOpBufferSize = 128; // FIXME: might be much bigger in TX3. 24 let PostRAScheduler = 1; // Using PostRA sched. 25 let CompleteModel = 1; 26 27 list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F, 28 PAUnsupported.F, 29 SMEUnsupported.F, 30 [HasMTE]); 31 // FIXME: Remove when all errors have been fixed. 32 let FullInstRWOverlapCheck = 0; 33} 34 35let SchedModel = ThunderX3T110Model in { 36 37// Issue ports. 38 39// Port 0: ALU. 40def THX3T110P0 : ProcResource<1>; 41 42// Port 1: ALU. 43def THX3T110P1 : ProcResource<1>; 44 45// Port 2: ALU/Branch. 46def THX3T110P2 : ProcResource<1>; 47 48// Port 3: ALU/Branch. 49def THX3T110P3 : ProcResource<1>; 50 51// Port 4: Load/Store. 52def THX3T110P4 : ProcResource<1>; 53 54// Port 5: Load/store. 55def THX3T110P5 : ProcResource<1>; 56 57// Port 6: FP/Neon/SIMD/Crypto. 58def THX3T110P6FP0 : ProcResource<1>; 59 60// Port 7: FP/Neon/SIMD/Crypto. 61def THX3T110P7FP1 : ProcResource<1>; 62 63// Port 8: FP/Neon/SIMD/Crypto. 64def THX3T110P8FP2 : ProcResource<1>; 65 66// Port 9: FP/Neon/SIMD/Crypto. 67def THX3T110P9FP3 : ProcResource<1>; 68 69// Port 10: Store Data Unit. 70def THX3T110SD0 : ProcResource<1>; 71 72// Define groups for the functional units on each issue port. Each group 73// created will be used by a WriteRes. 74 75// Integer divide/mulhi micro-ops only on port I1. 76def THX3T110I1 : ProcResGroup<[THX3T110P1]>; 77 78// Branch micro-ops on ports I2/I3. 79def THX3T110I23 : ProcResGroup<[THX3T110P2, THX3T110P3]>; 80 81// Branch micro-ops on ports I1/I2/I3. 82def THX3T110I123 : ProcResGroup<[THX3T110P1, THX3T110P2, THX3T110P3]>; 83 84// Integer micro-ops on ports I0/I1/I2. 85def THX3T110I012 : ProcResGroup<[THX3T110P0, THX3T110P1, THX3T110P2]>; 86 87// Integer micro-ops on ports I0/I1/I2/I3. 88def THX3T110I0123 : ProcResGroup<[THX3T110P0, THX3T110P1, 89 THX3T110P2, THX3T110P3]>; 90 91// FP micro-ops on ports FP0/FP1/FP2/FP3. 92def THX3T110FP0123 : ProcResGroup<[THX3T110P6FP0, THX3T110P7FP1, 93 THX3T110P8FP2, THX3T110P9FP3]>; 94 95// FP micro-ops on ports FP2/FP3. 96def THX3T110FP23 : ProcResGroup<[THX3T110P8FP2, THX3T110P9FP3]>; 97 98// ASIMD micro-ops on ports FP0/FP1/FP2/FP3. 99def THX3T110SIMD : ProcResGroup<[THX3T110P6FP0, THX3T110P7FP1, 100 THX3T110P8FP2, THX3T110P9FP3]>; 101 102// Store data micro-ops only on port 10. 103def THX3T110SD : ProcResGroup<[THX3T110SD0]>; 104 105// Load/store micro-ops on ports P4/P5. 106def THX3T110LS : ProcResGroup<[THX3T110P4, THX3T110P5]>; 107 108// 70 entry unified scheduler. 109def THX3T110ANY: ProcResGroup<[THX3T110P0, THX3T110P1, THX3T110P2, 110 THX3T110P3, THX3T110P4, THX3T110P5, 111 THX3T110P6FP0, THX3T110P7FP1, 112 THX3T110P8FP2, THX3T110P9FP3]> { 113 let BufferSize = 70; 114} 115 116// Define commonly used write types for InstRW specializations. 117// All definitions follow the format: THX3T110Write_<NumCycles>Cyc_<Resources>. 118 119// 3 cycles on I1. 120def THX3T110Write_3Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 121 let Latency = 3; 122 let NumMicroOps = 2; 123} 124 125// 4 cycles on I1. 126def THX3T110Write_4Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 127 let Latency = 4; 128 let NumMicroOps = 2; 129} 130 131// 5 cycles on I1. 132def THX3T110Write_5Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 133 let Latency = 5; 134 let NumMicroOps = 2; 135} 136 137// 7 cycles on I1. 138def THX3T110Write_7Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 139 let Latency = 7; 140 let NumMicroOps = 3; 141} 142 143// 23 cycles on I1. 144def THX3T110Write_23Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 145 let Latency = 23; 146 let ResourceCycles = [13, 23]; 147 let NumMicroOps = 4; 148} 149 150// 39 cycles on I1. 151def THX3T110Write_39Cyc_I1 : SchedWriteRes<[THX3T110I1]> { 152 let Latency = 39; 153 let ResourceCycles = [13, 39]; 154 let NumMicroOps = 4; 155} 156 157// 1 cycle on I2/I3 158def THX3T110Write_1Cyc_I23 : SchedWriteRes<[THX3T110I23]> { 159 let Latency = 1; 160 let NumMicroOps = 2; 161} 162 163// 8 cycles on I2/I3 164def THX3T110Write_8Cyc_I23 : SchedWriteRes<[THX3T110I23]> { 165 let Latency = 8; 166 let NumMicroOps = 3; 167} 168 169// 1 cycle on I1/I2/I3 170def THX3T110Write_1Cyc_I123 : SchedWriteRes<[THX3T110I123]> { 171 let Latency = 1; 172 let NumMicroOps = 2; 173} 174 175// 8 cycles on I1/I2/I3 176def THX3T110Write_8Cyc_I123 : SchedWriteRes<[THX3T110I123]> { 177 let Latency = 8; 178 let NumMicroOps = 3; 179} 180 181// 1 cycle on I0/I1/I2/I3. 182def THX3T110Write_1Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 183 let Latency = 1; 184 let NumMicroOps = 2; 185} 186 187// 2 cycles on I0/I1/I2/I3. 188def THX3T110Write_2Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 189 let Latency = 2; 190 let NumMicroOps = 2; 191} 192 193// 3 cycles on I0/I1/I2/I3. 194def THX3T110Write_3Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 195 let Latency = 3; 196 let NumMicroOps = 2; 197} 198 199// 4 cycles on I0/I1/I2/I3. 200def THX3T110Write_4Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 201 let Latency = 4; 202 let NumMicroOps = 3; 203} 204 205// 5 cycles on I0/I1/I2/I3. 206def THX3T110Write_5Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 207 let Latency = 5; 208 let NumMicroOps = 3; 209} 210 211// 6 cycles on I0/I1/I2/I3. 212def THX3T110Write_6Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 213 let Latency = 6; 214 let NumMicroOps = 3; 215} 216 217// 8 cycles on I0/I1/I2/I3. 218def THX3T110Write_8Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 219 let Latency = 8; 220 let NumMicroOps = 4; 221} 222 223// 13 cycles on I0/I1/I2/I3. 224def THX3T110Write_13Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 225 let Latency = 13; 226 let NumMicroOps = 3; 227} 228 229// 23 cycles on I0/I1/I2/I3. 230def THX3T110Write_23Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 231 let Latency = 23; 232 let NumMicroOps = 3; 233} 234 235// 39 cycles on I0/I1/I2/I3. 236def THX3T110Write_39Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> { 237 let Latency = 39; 238 let NumMicroOps = 3; 239} 240 241// 4 cycles on F2/F3. 242def THX3T110Write_4Cyc_F23 : SchedWriteRes<[THX3T110FP23]> { 243 let Latency = 4; 244 let NumMicroOps = 2; 245} 246 247// 5 cycles on F0/F1/F2/F3. 248def THX3T110Write_5Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 249 let Latency = 5; 250 let NumMicroOps = 2; 251} 252 253// 6 cycles on F0/F1/F2/F3. 254def THX3T110Write_6Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 255 let Latency = 6; 256 let NumMicroOps = 3; 257} 258 259// 7 cycles on F0/F1/F2/F3. 260def THX3T110Write_7Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 261 let Latency = 7; 262 let NumMicroOps = 3; 263} 264 265// 8 cycles on F0/F1/F2/F3. 266def THX3T110Write_8Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 267 let Latency = 8; 268 let NumMicroOps = 3; 269} 270 271// 10 cycles on F0/F1/F2/F3. 272def THX3T110Write_10Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 273 let Latency = 10; 274 let NumMicroOps = 3; 275} 276 277// 16 cycles on F0/F1/F2/F3. 278def THX3T110Write_16Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 279 let Latency = 16; 280 let NumMicroOps = 3; 281 let ResourceCycles = [8]; 282} 283 284// 23 cycles on F0/F1/F2/F3. 285def THX3T110Write_23Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> { 286 let Latency = 23; 287 let NumMicroOps = 3; 288 let ResourceCycles = [11]; 289} 290 291// 1 cycle on LS0/LS1. 292def THX3T110Write_1Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 293 let Latency = 1; 294 let NumMicroOps = 1; 295} 296 297// 2 cycles on LS0/LS1. 298def THX3T110Write_2Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 299 let Latency = 2; 300 let NumMicroOps = 2; 301} 302 303// 4 cycles on LS0/LS1. 304def THX3T110Write_4Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 305 let Latency = 4; 306 let NumMicroOps = 2; 307 let ResourceCycles = [2]; 308} 309 310// 5 cycles on LS0/LS1. 311def THX3T110Write_5Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 312 let Latency = 5; 313 let NumMicroOps = 3; 314} 315 316// 6 cycles on LS0/LS1. 317def THX3T110Write_6Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 318 let Latency = 6; 319 let NumMicroOps = 3; 320} 321 322// 4 + 5 cycles on LS0/LS1. 323// First resource is available after 4 cycles. 324// Second resource is available after 5 cycles. 325// Load vector pair, immed offset, Q-form [LDP/LDNP]. 326def THX3T110Write_4_5Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 327 let Latency = 4; 328 let NumMicroOps = 2; 329 let ResourceCycles = [4, 5]; 330} 331 332// 4 + 8 cycles on LS0/LS1. 333// First resource is available after 4 cycles. 334// Second resource is available after 8 cycles. 335// Load vector pair, immed offset, S/D-form [LDP/LDNP]. 336def THX3T110Write_4_8Cyc_LS01 : SchedWriteRes<[THX3T110LS]> { 337 let Latency = 4; 338 let NumMicroOps = 2; 339 let ResourceCycles = [4, 8]; 340} 341 342// 11 cycles on LS0/LS1 and I1. 343def THX3T110Write_11Cyc_LS01_I1 : 344 SchedWriteRes<[THX3T110LS, THX3T110I1]> { 345 let Latency = 11; 346 let NumMicroOps = 4; 347} 348 349// 1 cycles on LS0/LS1 and I0/I1/I2/I3. 350def THX3T110Write_1Cyc_LS01_I0123 : 351 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 352 let Latency = 1; 353 let NumMicroOps = 2; 354} 355 356// 1 cycles on LS0/LS1 and 2 of I0/I1/I2/I3. 357def THX3T110Write_1Cyc_LS01_I0123_I0123 : 358 SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> { 359 let Latency = 1; 360 let NumMicroOps = 3; 361} 362 363// 4 cycles on LS0/LS1 and I0/I1/I2/I3. 364def THX3T110Write_4Cyc_LS01_I0123 : 365 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 366 let Latency = 4; 367 let NumMicroOps = 3; 368} 369 370// 4 cycles on LS0/LS1 and 2 of I0/I1/I2/I3. 371def THX3T110Write_4Cyc_LS01_I0123_I0123 : 372 SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> { 373 let Latency = 4; 374 let NumMicroOps = 3; 375} 376 377// 5 cycles on LS0/LS1 and I0/I1/I2/I3. 378def THX3T110Write_5Cyc_LS01_I0123 : 379 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 380 let Latency = 5; 381 let NumMicroOps = 3; 382} 383 384// 5 cycles on LS0/LS1 and 2 of I0/I1/I2/I3. 385def THX3T110Write_5Cyc_LS01_I0123_I0123 : 386 SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> { 387 let Latency = 5; 388 let NumMicroOps = 3; 389} 390 391// 6 cycles on LS0/LS1 and I0/I1/I2/I3. 392def THX3T110Write_6Cyc_LS01_I012 : 393 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 394 let Latency = 6; 395 let NumMicroOps = 4; 396} 397 398// 6 cycles on LS0/LS1 and 2 of I0/I1/I2/I3. 399def THX3T110Write_6Cyc_LS01_I0123_I0123 : 400 SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> { 401 let Latency = 6; 402 let NumMicroOps = 3; 403} 404 405// 1 cycle on LS0/LS1 and SD. 406def THX3T110Write_1Cyc_LS01_SD : 407 SchedWriteRes<[THX3T110LS, THX3T110SD]> { 408 let Latency = 1; 409 let NumMicroOps = 2; 410} 411 412// 2 cycles on LS0/LS1 and SD. 413def THX3T110Write_2Cyc_LS01_SD : 414 SchedWriteRes<[THX3T110LS, THX3T110SD]> { 415 let Latency = 2; 416 let NumMicroOps = 2; 417} 418 419// 4 cycles on LS0/LS1 and SD. 420def THX3T110Write_4Cyc_LS01_SD : 421 SchedWriteRes<[THX3T110LS, THX3T110SD]> { 422 let Latency = 4; 423 let NumMicroOps = 3; 424} 425 426// 5 cycles on LS0/LS1 and SD. 427def THX3T110Write_5Cyc_LS01_SD : 428 SchedWriteRes<[THX3T110LS, THX3T110SD]> { 429 let Latency = 5; 430 let NumMicroOps = 4; 431} 432 433// 6 cycles on LS0/LS1 and SD. 434def THX3T110Write_6Cyc_LS01_SD : 435 SchedWriteRes<[THX3T110LS, THX3T110SD]> { 436 let Latency = 6; 437 let NumMicroOps = 5; 438} 439 440// 1 cycle on LS0/LS1, SD and I0/I1/I2/I3. 441def THX3T110Write_1Cyc_LS01_SD_I0123 : 442 SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> { 443 let Latency = 1; 444 let NumMicroOps = 2; 445} 446 447// 2 cycles on LS0/LS1, SD and I0/I1/I2/I3. 448def THX3T110Write_2Cyc_LS01_SD_I0123 : 449 SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> { 450 let Latency = 2; 451 let NumMicroOps = 2; 452} 453 454// 4 cycles on LS0/LS1, SD and I0/I1/I2/I3. 455def THX3T110Write_4Cyc_LS01_SD_I0123 : 456 SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> { 457 let Latency = 4; 458 let NumMicroOps = 3; 459} 460 461// 5 cycles on LS0/LS1, SD and I0/I1/I2/I3. 462def THX3T110Write_5Cyc_LS01_SD_I0123 : 463 SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> { 464 let Latency = 5; 465 let NumMicroOps = 4; 466} 467 468// 6 cycles on LS0/LS1, SD and I0/I1/I2/I3. 469def THX3T110Write_6Cyc_LS01_SD_I0123 : 470 SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> { 471 let Latency = 6; 472 let NumMicroOps = 5; 473} 474 475// 1 cycles on LS0/LS1 and F0/F1/F2/F3. 476def THX3T110Write_1Cyc_LS01_F0123 : 477 SchedWriteRes<[THX3T110LS, THX3T110FP0123]> { 478 let Latency = 1; 479 let NumMicroOps = 2; 480} 481 482// 5 cycles on LS0/LS1 and F0/F1/F2/F3. 483def THX3T110Write_5Cyc_LS01_F0123 : 484 SchedWriteRes<[THX3T110LS, THX3T110FP0123]> { 485 let Latency = 5; 486 let NumMicroOps = 3; 487} 488 489// 6 cycles on LS0/LS1 and F0/F1/F2/F3. 490def THX3T110Write_6Cyc_LS01_F0123 : 491 SchedWriteRes<[THX3T110LS, THX3T110FP0123]> { 492 let Latency = 6; 493 let NumMicroOps = 3; 494} 495 496// 7 cycles on LS0/LS1 and F0/F1/F2/F3. 497def THX3T110Write_7Cyc_LS01_F0123 : 498 SchedWriteRes<[THX3T110LS, THX3T110FP0123]> { 499 let Latency = 7; 500 let NumMicroOps = 3; 501} 502 503// 8 cycles on LS0/LS1 and F0/F1/F2/F3. 504def THX3T110Write_8Cyc_LS01_F0123 : 505 SchedWriteRes<[THX3T110LS, THX3T110FP0123]> { 506 let Latency = 8; 507 let NumMicroOps = 3; 508} 509 510// 8 cycles on LS0/LS1 and I0/I1/I2/I3. 511def THX3T110Write_8Cyc_LS01_I0123 : 512 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 513 let Latency = 8; 514 let NumMicroOps = 3; 515} 516 517// 12 cycles on LS0/LS1 and I0/I1/I2/I3. 518def THX3T110Write_12Cyc_LS01_I0123 : 519 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 520 let Latency = 12; 521 let NumMicroOps = 4; 522} 523 524// 16 cycles on LS0/LS1 and I0/I1/I2/I3. 525def THX3T110Write_16Cyc_LS01_I0123 : 526 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 527 let Latency = 16; 528 let NumMicroOps = 5; 529} 530 531// 24 cycles on LS0/LS1 and I0/I1/I2/I3. 532def THX3T110Write_24Cyc_LS01_I0123 : 533 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 534 let Latency = 24; 535 let NumMicroOps = 10; 536} 537 538// 32 cycles on LS0/LS1 and I0/I1/I2/I3. 539def THX3T110Write_32Cyc_LS01_I0123 : 540 SchedWriteRes<[THX3T110LS, THX3T110I0123]> { 541 let Latency = 32; 542 let NumMicroOps = 14; 543} 544 545// 3 cycles on F0/F1/F2/F3. 546def THX3T110Write_3Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 547 let Latency = 3; 548 let NumMicroOps = 2; 549} 550 551// 4 cycles on F0/F1/F2/F3. 552def THX3T110Write_4Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 553 let Latency = 4; 554 let NumMicroOps = 2; 555} 556 557// 5 cycles on F0/F1/F2/F3. 558def THX3T110Write_5Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 559 let Latency = 5; 560 let NumMicroOps = 2; 561} 562 563// 10 cycles on F0/F1/F2/F3. 564def THX3T110Write_10Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 565 let Latency = 10; 566 let NumMicroOps = 4; 567} 568 569// 15 cycles on F0/F1/F2/F3. 570def THX3T110Write_15Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 571 let Latency = 15; 572 let NumMicroOps = 7; 573} 574 575// 16 cycles on F0/F1/F2/F3. 576def THX3T110Write_16Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 577 let Latency = 16; 578 let NumMicroOps = 3; 579} 580 581// 18 cycles on F0/F1/F2/F3. 582def THX3T110Write_18Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 583 let Latency = 18; 584 let NumMicroOps = 3; 585} 586 587// 19 cycles on F0/F1/F2/F3. 588def THX3T110Write_19Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 589 let Latency = 19; 590 let NumMicroOps = 4; 591} 592 593// 20 cycles on F0/F1/F2/F3. 594def THX3T110Write_20Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 595 let Latency = 20; 596 let NumMicroOps = 4; 597} 598 599// 23 cycles on F0/F1/F2/F3. 600def THX3T110Write_23Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> { 601 let Latency = 23; 602 let NumMicroOps = 4; 603} 604 605// 3 cycles on F2/F3 and 4 cycles on F0/F1/F2/F3. 606def THX3T110Write_3_4Cyc_F23_F0123 : 607 SchedWriteRes<[THX3T110FP23, THX3T110FP0123]> { 608 let Latency = 3; 609 let NumMicroOps = 2; 610 let ResourceCycles = [3, 4]; 611} 612 613 614// Define commonly used read types. 615 616// No forwarding is provided for these types. 617def : ReadAdvance<ReadI, 0>; 618def : ReadAdvance<ReadISReg, 0>; 619def : ReadAdvance<ReadIEReg, 0>; 620def : ReadAdvance<ReadIM, 0>; 621def : ReadAdvance<ReadIMA, 0>; 622def : ReadAdvance<ReadID, 0>; 623def : ReadAdvance<ReadExtrHi, 0>; 624def : ReadAdvance<ReadAdrBase, 0>; 625def : ReadAdvance<ReadVLD, 0>; 626def : ReadAdvance<ReadST, 0>; 627 628//===----------------------------------------------------------------------===// 629// 3. Instruction Tables. 630 631//--- 632// 3.1 Branch Instructions 633//--- 634 635// Branch, immed 636// Branch and link, immed 637// Compare and branch 638def : WriteRes<WriteBr, [THX3T110I23]> { 639 let Latency = 1; 640 let NumMicroOps = 2; 641} 642 643// Branch, register 644// Branch and link, register != LR 645// Branch and link, register = LR 646def : WriteRes<WriteBrReg, [THX3T110I23]> { 647 let Latency = 1; 648 let NumMicroOps = 2; 649} 650 651def : WriteRes<WriteSys, []> { let Latency = 1; } 652def : WriteRes<WriteBarrier, []> { let Latency = 1; } 653def : WriteRes<WriteHint, []> { let Latency = 1; } 654 655def : WriteRes<WriteAtomic, []> { 656 let Latency = 4; 657 let NumMicroOps = 2; 658} 659 660//--- 661// Branch 662//--- 663def : InstRW<[THX3T110Write_1Cyc_I23], (instrs B, BL, BR, BLR)>; 664def : InstRW<[THX3T110Write_1Cyc_I23], (instrs Bcc)>; 665def : InstRW<[THX3T110Write_1Cyc_I23], (instrs RET)>; 666def : InstRW<[THX3T110Write_1Cyc_I23], 667 (instrs CBZW, CBZX, CBNZW, CBNZX, TBZW, TBZX, TBNZW, TBNZX)>; 668 669//--- 670// 3.2 Arithmetic and Logical Instructions 671// 3.3 Move and Shift Instructions 672//--- 673 674 675// ALU, basic 676// Conditional compare 677// Conditional select 678// Address generation 679def : WriteRes<WriteI, [THX3T110I0123]> { 680 let Latency = 1; 681 let ResourceCycles = [1]; 682 let NumMicroOps = 2; 683} 684 685def : InstRW<[WriteI], 686 (instregex "ADD?(W|X)r(i|r|s|x)", "ADDS?(W|X)r(i|r|s|x)(64)?", 687 "AND?(W|X)r(i|r|s|x)", "ANDS?(W|X)r(i|r|s|x)", 688 "ADC(W|X)r", 689 "BIC?(W|X)r(i|r|s|x)", "BICS?(W|X)r(i|r|s|x)", 690 "EON?(W|X)r(i|r|s|x)", "ORN?(W|X)r(i|r|s|x)", 691 "ORR?(W|X)r(i|r|s|x)", "SUB?(W|X)r(i|r|s|x)", 692 "SUBS?(W|X)r(i|r|s|x)", "SBC(W|X)r", 693 "SBCS(W|X)r", "CCMN(W|X)(i|r)", 694 "CCMP(W|X)(i|r)", "CSEL(W|X)r", 695 "CSINC(W|X)r", "CSINV(W|X)r", 696 "CSNEG(W|X)r")>; 697 698def : InstRW<[WriteI], (instrs COPY)>; 699 700// ALU, extend and/or shift 701def : WriteRes<WriteISReg, [THX3T110I0123]> { 702 let Latency = 2; 703 let ResourceCycles = [2]; 704 let NumMicroOps = 2; 705} 706 707def : InstRW<[WriteISReg], 708 (instregex "ADD?(W|X)r(i|r|s|x)", "ADDS?(W|X)r(i|r|s|x)(64)?", 709 "AND?(W|X)r(i|r|s|x)", "ANDS?(W|X)r(i|r|s|x)", 710 "ADC(W|X)r", 711 "BIC?(W|X)r(i|r|s|x)", "BICS?(W|X)r(i|r|s|x)", 712 "EON?(W|X)r(i|r|s|x)", "ORN?(W|X)r(i|r|s|x)", 713 "ORR?(W|X)r(i|r|s|x)", "SUB?(W|X)r(i|r|s|x)", 714 "SUBS?(W|X)r(i|r|s|x)", "SBC(W|X)r", 715 "SBCS(W|X)r", "CCMN(W|X)(i|r)", 716 "CCMP(W|X)(i|r)", "CSEL(W|X)r", 717 "CSINC(W|X)r", "CSINV(W|X)r", 718 "CSNEG(W|X)r")>; 719 720def : WriteRes<WriteIEReg, [THX3T110I0123]> { 721 let Latency = 1; 722 let ResourceCycles = [1]; 723 let NumMicroOps = 2; 724} 725 726def : InstRW<[WriteIEReg], 727 (instregex "ADD?(W|X)r(i|r|s|x)", "ADDS?(W|X)r(i|r|s|x)(64)?", 728 "AND?(W|X)r(i|r|s|x)", "ANDS?(W|X)r(i|r|s|x)", 729 "ADC(W|X)r", 730 "BIC?(W|X)r(i|r|s|x)", "BICS?(W|X)r(i|r|s|x)", 731 "EON?(W|X)r(i|r|s|x)", "ORN?(W|X)r(i|r|s|x)", 732 "ORR?(W|X)r(i|r|s|x)", "SUB?(W|X)r(i|r|s|x)", 733 "SUBS?(W|X)r(i|r|s|x)", "SBC(W|X)r", 734 "SBCS(W|X)r", "CCMN(W|X)(i|r)", 735 "CCMP(W|X)(i|r)", "CSEL(W|X)r", 736 "CSINC(W|X)r", "CSINV(W|X)r", 737 "CSNEG(W|X)r")>; 738 739// Move immed 740def : WriteRes<WriteImm, [THX3T110I0123]> { 741 let Latency = 1; 742 let NumMicroOps = 2; 743} 744 745def : InstRW<[THX3T110Write_1Cyc_I0123], 746 (instrs MOVKWi, MOVKXi, MOVNWi, MOVNXi, MOVZWi, MOVZXi)>; 747 748def : InstRW<[THX3T110Write_1Cyc_I0123], 749 (instrs ASRVWr, ASRVXr, LSLVWr, LSLVXr, RORVWr, RORVXr)>; 750 751// Variable shift 752def : WriteRes<WriteIS, [THX3T110I0123]> { 753 let Latency = 1; 754 let NumMicroOps = 2; 755} 756 757//--- 758// 3.4 Divide and Multiply Instructions 759//--- 760 761// Divide, W-form 762// Latency range of 13-23/13-39. 763def : WriteRes<WriteID32, [THX3T110I1]> { 764 let Latency = 39; 765 let ResourceCycles = [39]; 766 let NumMicroOps = 4; 767} 768 769// Divide, X-form 770def : WriteRes<WriteID64, [THX3T110I1]> { 771 let Latency = 23; 772 let ResourceCycles = [23]; 773 let NumMicroOps = 4; 774} 775 776// Multiply accumulate, W-form 777def : WriteRes<WriteIM32, [THX3T110I0123]> { 778 let Latency = 5; 779 let NumMicroOps = 3; 780} 781 782// Multiply accumulate, X-form 783def : WriteRes<WriteIM64, [THX3T110I0123]> { 784 let Latency = 5; 785 let NumMicroOps = 3; 786} 787 788//def : InstRW<[WriteIM32, ReadIM, ReadIM, ReadIMA, THX3T110Write_5Cyc_I012], 789// (instrs MADDWrrr, MSUBWrrr)>; 790def : InstRW<[WriteIM32], (instrs MADDWrrr, MSUBWrrr)>; 791def : InstRW<[WriteIM32], (instrs MADDXrrr, MSUBXrrr)>; 792def : InstRW<[THX3T110Write_5Cyc_I0123], 793 (instregex "(S|U)(MADDL|MSUBL)rrr")>; 794 795def : InstRW<[WriteID32], (instrs SDIVWr, UDIVWr)>; 796def : InstRW<[WriteID64], (instrs SDIVXr, UDIVXr)>; 797 798// Bitfield extract, two reg 799def : WriteRes<WriteExtr, [THX3T110I0123]> { 800 let Latency = 1; 801 let NumMicroOps = 2; 802} 803 804// Multiply high 805def : InstRW<[THX3T110Write_4Cyc_I1], (instrs SMULHrr, UMULHrr)>; 806 807// Miscellaneous Data-Processing Instructions 808// Bitfield extract 809def : InstRW<[THX3T110Write_1Cyc_I0123], (instrs EXTRWrri, EXTRXrri)>; 810 811// Bitifield move - basic 812def : InstRW<[THX3T110Write_1Cyc_I0123], 813 (instrs SBFMWri, SBFMXri, UBFMWri, UBFMXri)>; 814 815// Bitfield move, insert 816def : InstRW<[THX3T110Write_1Cyc_I0123], (instregex "^BFM")>; 817def : InstRW<[THX3T110Write_1Cyc_I0123], (instregex "(S|U)?BFM.*")>; 818 819// Count leading 820def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], 821 (instregex "^CLS(W|X)r$", "^CLZ(W|X)r$")>; 822 823// Reverse bits 824def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instrs RBITWr, RBITXr)>; 825 826// Cryptography Extensions 827def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^AES[DE]")>; 828def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^AESI?MC")>; 829def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^PMULL")>; 830def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1SU0")>; 831def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1(H|SU1)")>; 832def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1[CMP]")>; 833def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA256SU0")>; 834def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA256(H|H2|SU1)")>; 835 836// CRC Instructions 837// def : InstRW<[THX3T110Write_4Cyc_I1], (instregex "^CRC32", "^CRC32C")>; 838def : InstRW<[THX3T110Write_4Cyc_I1], 839 (instrs CRC32Brr, CRC32Hrr, CRC32Wrr, CRC32Xrr)>; 840 841def : InstRW<[THX3T110Write_4Cyc_I1], 842 (instrs CRC32CBrr, CRC32CHrr, CRC32CWrr, CRC32CXrr)>; 843 844// Reverse bits/bytes 845// NOTE: Handled by WriteI. 846 847//--- 848// 3.6 Load Instructions 849// 3.10 FP Load Instructions 850//--- 851 852// Load register, literal 853// Load register, unscaled immed 854// Load register, immed unprivileged 855// Load register, unsigned immed 856def : WriteRes<WriteLD, [THX3T110LS]> { 857 let Latency = 4; 858 let NumMicroOps = 4; 859} 860 861// Load register, immed post-index 862// NOTE: Handled by WriteLD, WriteI. 863// Load register, immed pre-index 864// NOTE: Handled by WriteLD, WriteAdr. 865def : WriteRes<WriteAdr, [THX3T110I0123]> { 866 let Latency = 1; 867 let NumMicroOps = 2; 868} 869 870// Load pair, immed offset, normal 871// Load pair, immed offset, signed words, base != SP 872// Load pair, immed offset signed words, base = SP 873// LDP only breaks into *one* LS micro-op. Thus 874// the resources are handled by WriteLD. 875def : WriteRes<WriteLDHi, []> { 876 let Latency = 4; 877 let NumMicroOps = 4; 878} 879 880// Load register offset, basic 881// Load register, register offset, scale by 4/8 882// Load register, register offset, scale by 2 883// Load register offset, extend 884// Load register, register offset, extend, scale by 4/8 885// Load register, register offset, extend, scale by 2 886def THX3T110WriteLDIdx : SchedWriteVariant<[ 887 SchedVar<ScaledIdxPred, [THX3T110Write_4Cyc_LS01_I0123_I0123]>, 888 SchedVar<NoSchedPred, [THX3T110Write_4Cyc_LS01_I0123]>]>; 889def : SchedAlias<WriteLDIdx, THX3T110WriteLDIdx>; 890 891def THX3T110ReadAdrBase : SchedReadVariant<[ 892 SchedVar<ScaledIdxPred, [ReadDefault]>, 893 SchedVar<NoSchedPred, [ReadDefault]>]>; 894def : SchedAlias<ReadAdrBase, THX3T110ReadAdrBase>; 895 896// Load pair, immed pre-index, normal 897// Load pair, immed pre-index, signed words 898// Load pair, immed post-index, normal 899// Load pair, immed post-index, signed words 900def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPDi)>; 901def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPQi)>; 902def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPSi)>; 903def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPWi)>; 904def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPXi)>; 905 906def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPDi)>; 907def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPQi)>; 908def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPSi)>; 909def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPSWi)>; 910def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPWi)>; 911def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPXi)>; 912 913def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRBui)>; 914def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRDui)>; 915def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRHui)>; 916def : InstRW<[THX3T110Write_5Cyc_LS01], (instrs LDRQui)>; 917def : InstRW<[THX3T110Write_5Cyc_LS01], (instrs LDRSui)>; 918 919def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRDl)>; 920def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRQl)>; 921def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRWl)>; 922def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRXl)>; 923 924def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRBi)>; 925def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRHi)>; 926def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRWi)>; 927def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRXi)>; 928 929def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSBWi)>; 930def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSBXi)>; 931def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSHWi)>; 932def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSHXi)>; 933def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSWi)>; 934 935def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 936 (instrs LDPDpre)>; 937def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 938 (instrs LDPQpre)>; 939def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 940 (instrs LDPSpre)>; 941def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 942 (instrs LDPWpre)>; 943def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 944 (instrs LDPWpre)>; 945 946def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr], 947 (instrs LDRBpre, LDRDpre, LDRHpre, LDRQpre, 948 LDRSpre, LDRWpre, LDRXpre, 949 LDRSBWpre, LDRSBXpre, LDRSBWpost, LDRSBXpost, 950 LDRSHWpre, LDRSHXpre, LDRSHWpost, LDRSHXpost, 951 LDRBBpre, LDRBBpost, LDRHHpre, LDRHHpost)>; 952 953def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr], 954 (instrs LDPDpost, LDPQpost, LDPSpost, LDPWpost, LDPXpost)>; 955 956def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteI], 957 (instrs LDRBpost, LDRDpost, LDRHpost, 958 LDRQpost, LDRSpost, LDRWpost, LDRXpost)>; 959 960def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteLDHi, WriteAdr], 961 (instrs LDPDpre, LDPQpre, LDPSpre, LDPWpre, LDPXpre)>; 962 963def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteAdr], 964 (instrs LDRBpre, LDRDpre, LDRHpre, LDRQpre, 965 LDRSpre, LDRWpre, LDRXpre)>; 966 967def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteLDHi, WriteAdr], 968 (instrs LDPDpost, LDPQpost, LDPSpost, LDPWpost, LDPXpost)>; 969 970def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteI], 971 (instrs LDRBpost, LDRDpost, LDRHpost, LDRQpost, 972 LDRSpost, LDRWpost, LDRXpost)>; 973 974def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRBroW)>; 975def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRDroW)>; 976def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHroW)>; 977def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHHroW)>; 978def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRQroW)>; 979def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSroW)>; 980def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHWroW)>; 981def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHXroW)>; 982def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRWroW)>; 983def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRXroW)>; 984 985def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRBroX)>; 986def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRDroX)>; 987def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHHroX)>; 988def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHroX)>; 989def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRQroX)>; 990def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSroX)>; 991def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHWroX)>; 992def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHXroX)>; 993def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRWroX)>; 994def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRXroX)>; 995 996def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURBi)>; 997def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURBBi)>; 998def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURDi)>; 999def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURHi)>; 1000def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURHHi)>; 1001def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURQi)>; 1002def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSi)>; 1003def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURXi)>; 1004def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSBWi)>; 1005def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSBXi)>; 1006def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSHWi)>; 1007def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSHXi)>; 1008def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSWi)>; 1009 1010// Load exclusive 1011def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAR(B|H|W|X)$")>; 1012def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAXR(B|H|W|X)$")>; 1013def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDXR(B|H|W|X)$")>; 1014def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAXP(W|X)$")>; 1015def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDXP(W|X)$")>; 1016 1017//--- 1018// Prefetch 1019//--- 1020def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMl)>; 1021def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFUMi)>; 1022def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMui)>; 1023def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMroW)>; 1024def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMroX)>; 1025 1026//-- 1027// 3.7 Store Instructions 1028// 3.11 FP Store Instructions 1029//-- 1030 1031// Store register, unscaled immed 1032// Store register, immed unprivileged 1033// Store register, unsigned immed 1034def : WriteRes<WriteST, [THX3T110LS, THX3T110SD]> { 1035 let Latency = 1; 1036 let NumMicroOps = 2; 1037} 1038 1039// Store register, immed post-index 1040// NOTE: Handled by WriteAdr, WriteST, ReadAdrBase 1041 1042// Store register, immed pre-index 1043// NOTE: Handled by WriteAdr, WriteST 1044 1045// Store register, register offset, basic 1046// Store register, register offset, scaled by 4/8 1047// Store register, register offset, scaled by 2 1048// Store register, register offset, extend 1049// Store register, register offset, extend, scale by 4/8 1050// Store register, register offset, extend, scale by 1 1051def : WriteRes<WriteSTIdx, [THX3T110LS, THX3T110SD, THX3T110I0123]> { 1052 let Latency = 1; 1053 let NumMicroOps = 2; 1054} 1055 1056// Store pair, immed offset, W-form 1057// Store pair, immed offset, X-form 1058def : WriteRes<WriteSTP, [THX3T110LS, THX3T110SD]> { 1059 let Latency = 1; 1060 let NumMicroOps = 2; 1061} 1062 1063// Store pair, immed post-index, W-form 1064// Store pair, immed post-index, X-form 1065// Store pair, immed pre-index, W-form 1066// Store pair, immed pre-index, X-form 1067// NOTE: Handled by WriteAdr, WriteSTP. 1068def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURBi)>; 1069def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURBBi)>; 1070def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURDi)>; 1071def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURHi)>; 1072def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURHHi)>; 1073def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURQi)>; 1074def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURSi)>; 1075def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURWi)>; 1076def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURXi)>; 1077 1078def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRBi)>; 1079def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRHi)>; 1080def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRWi)>; 1081def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRXi)>; 1082 1083def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPDi)>; 1084def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPQi)>; 1085def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPXi)>; 1086def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPWi)>; 1087 1088def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPDi)>; 1089def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPQi)>; 1090def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPXi)>; 1091def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPWi)>; 1092 1093def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRBui)>; 1094def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRDui)>; 1095def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRHui)>; 1096def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRQui)>; 1097def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRXui)>; 1098def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRWui)>; 1099 1100def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRBui)>; 1101def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRDui)>; 1102def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRHui)>; 1103def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRQui)>; 1104def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRXui)>; 1105def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRWui)>; 1106 1107def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRBui)>; 1108def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRDui)>; 1109def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRHui)>; 1110def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRQui)>; 1111def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRXui)>; 1112def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRWui)>; 1113 1114def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1115 (instrs STPDpre, STPDpost)>; 1116def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1117 (instrs STPDpre, STPDpost)>; 1118def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1119 (instrs STPQpre, STPQpost)>; 1120def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1121 (instrs STPQpre, STPQpost)>; 1122def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1123 (instrs STPSpre, STPSpost)>; 1124def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1125 (instrs STPSpre, STPSpost)>; 1126def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1127 (instrs STPWpre, STPWpost)>; 1128def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1129 (instrs STPWpre, STPWpost)>; 1130def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1131 (instrs STPXpre, STPXpost)>; 1132def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1133 (instrs STPXpre, STPXpost)>; 1134def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1135 (instrs STRBpre, STRBpost)>; 1136def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1137 (instrs STRBpre, STRBpost)>; 1138def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1139 (instrs STRBBpre, STRBBpost)>; 1140def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1141 (instrs STRBBpre, STRBBpost)>; 1142def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1143 (instrs STRDpre, STRDpost)>; 1144def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1145 (instrs STRDpre, STRDpost)>; 1146def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1147 (instrs STRHpre, STRHpost)>; 1148def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1149 (instrs STRHpre, STRHpost)>; 1150def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1151 (instrs STRHHpre, STRHHpost)>; 1152def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1153 (instrs STRHHpre, STRHHpost)>; 1154def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1155 (instrs STRQpre, STRQpost)>; 1156def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1157 (instrs STRQpre, STRQpost)>; 1158def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1159 (instrs STRSpre, STRSpost)>; 1160def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1161 (instrs STRSpre, STRSpost)>; 1162def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1163 (instrs STRWpre, STRWpost)>; 1164def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1165 (instrs STRWpre, STRWpost)>; 1166def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123], 1167 (instrs STRXpre, STRXpost)>; 1168def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1169 (instrs STRXpre, STRXpost)>; 1170def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1171 (instrs STRBroW, STRBroX)>; 1172def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1173 (instrs STRBBroW, STRBBroX)>; 1174def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1175 (instrs STRDroW, STRDroX)>; 1176def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1177 (instrs STRHroW, STRHroX)>; 1178def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1179 (instrs STRHHroW, STRHHroX)>; 1180def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1181 (instrs STRQroW, STRQroX)>; 1182def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1183 (instrs STRSroW, STRSroX)>; 1184def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1185 (instrs STRWroW, STRWroX)>; 1186def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase], 1187 (instrs STRXroW, STRXroX)>; 1188 1189// Store exclusive 1190def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instrs STNPWi, STNPXi)>; 1191def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLR(B|H|W|X)$")>; 1192def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STXP(W|X)$")>; 1193def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STXR(B|H|W|X)$")>; 1194def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLXP(W|X)$")>; 1195def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLXR(B|H|W|X)$")>; 1196 1197//--- 1198// 3.8 FP Data Processing Instructions 1199//--- 1200 1201// FP absolute value 1202// FP min/max 1203// FP negate 1204def : WriteRes<WriteF, [THX3T110FP0123]> { 1205 let Latency = 5; 1206 let NumMicroOps = 2; 1207} 1208 1209// FP arithmetic 1210def : InstRW<[THX3T110Write_6Cyc_F01], (instregex "^FADD", "^FSUB")>; 1211 1212// FP compare 1213def : WriteRes<WriteFCmp, [THX3T110FP0123]> { 1214 let Latency = 5; 1215 let NumMicroOps = 2; 1216} 1217 1218// FP Mul, Div, Sqrt 1219def : WriteRes<WriteFDiv, [THX3T110FP0123]> { 1220 let Latency = 22; 1221 let ResourceCycles = [19]; 1222} 1223 1224def THX3T110XWriteFDiv : SchedWriteRes<[THX3T110FP0123]> { 1225 let Latency = 16; 1226 let ResourceCycles = [8]; 1227 let NumMicroOps = 4; 1228} 1229 1230def THX3T110XWriteFDivSP : SchedWriteRes<[THX3T110FP0123]> { 1231 let Latency = 16; 1232 let ResourceCycles = [8]; 1233 let NumMicroOps = 4; 1234} 1235 1236def THX3T110XWriteFDivDP : SchedWriteRes<[THX3T110FP0123]> { 1237 let Latency = 23; 1238 let ResourceCycles = [12]; 1239 let NumMicroOps = 4; 1240} 1241 1242def THX3T110XWriteFSqrtSP : SchedWriteRes<[THX3T110FP0123]> { 1243 let Latency = 16; 1244 let ResourceCycles = [8]; 1245 let NumMicroOps = 4; 1246} 1247 1248def THX3T110XWriteFSqrtDP : SchedWriteRes<[THX3T110FP0123]> { 1249 let Latency = 23; 1250 let ResourceCycles = [12]; 1251 let NumMicroOps = 4; 1252} 1253 1254// FP divide, S-form 1255// FP square root, S-form 1256def : InstRW<[THX3T110XWriteFDivSP], (instrs FDIVSrr)>; 1257def : InstRW<[THX3T110XWriteFSqrtSP], (instrs FSQRTSr)>; 1258def : InstRW<[THX3T110XWriteFDivSP], (instregex "^FDIVv.*32$")>; 1259def : InstRW<[THX3T110XWriteFSqrtSP], (instregex "^.*SQRT.*32$")>; 1260def : InstRW<[THX3T110Write_16Cyc_F01], (instregex "^FDIVSrr", "^FSQRTSr")>; 1261 1262// FP divide, D-form 1263// FP square root, D-form 1264def : InstRW<[THX3T110XWriteFDivDP], (instrs FDIVDrr)>; 1265def : InstRW<[THX3T110XWriteFSqrtDP], (instrs FSQRTDr)>; 1266def : InstRW<[THX3T110XWriteFDivDP], (instregex "^FDIVv.*64$")>; 1267def : InstRW<[THX3T110XWriteFSqrtDP], (instregex "^.*SQRT.*64$")>; 1268def : InstRW<[THX3T110Write_23Cyc_F01], (instregex "^FDIVDrr", "^FSQRTDr")>; 1269 1270// FP multiply 1271// FP multiply accumulate 1272def : WriteRes<WriteFMul, [THX3T110FP0123]> { 1273 let Latency = 6; 1274 let ResourceCycles = [2]; 1275 let NumMicroOps = 3; 1276} 1277 1278def THX3T110XWriteFMul : SchedWriteRes<[THX3T110FP0123]> { 1279 let Latency = 6; 1280 let ResourceCycles = [2]; 1281 let NumMicroOps = 3; 1282} 1283 1284def THX3T110XWriteFMulAcc : SchedWriteRes<[THX3T110FP0123]> { 1285 let Latency = 6; 1286 let ResourceCycles = [2]; 1287 let NumMicroOps = 3; 1288} 1289 1290def : InstRW<[THX3T110XWriteFMul], (instregex "^FMUL", "^FNMUL")>; 1291def : InstRW<[THX3T110XWriteFMulAcc], 1292 (instregex "^FMADD", "^FMSUB", "^FNMADD", "^FNMSUB")>; 1293 1294// FP round to integral 1295def : InstRW<[THX3T110Write_7Cyc_F01], 1296 (instregex "^FRINT(A|I|M|N|P|X|Z)(Sr|Dr)")>; 1297 1298// FP select 1299def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FCSEL")>; 1300 1301//--- 1302// 3.9 FP Miscellaneous Instructions 1303//--- 1304 1305// FP convert, from vec to vec reg 1306// FP convert, from gen to vec reg 1307// FP convert, from vec to gen reg 1308def : WriteRes<WriteFCvt, [THX3T110FP0123]> { 1309 let Latency = 7; 1310 let NumMicroOps = 3; 1311} 1312 1313// FP move, immed 1314// FP move, register 1315def : WriteRes<WriteFImm, [THX3T110FP0123]> { 1316 let Latency = 4; 1317 let NumMicroOps = 2; 1318} 1319 1320// FP transfer, from gen to vec reg 1321// FP transfer, from vec to gen reg 1322def : WriteRes<WriteFCopy, [THX3T110FP0123]> { 1323 let Latency = 4; 1324 let NumMicroOps = 2; 1325} 1326 1327def : InstRW<[THX3T110Write_5Cyc_F01], (instrs FMOVXDHighr, FMOVDXHighr)>; 1328 1329//--- 1330// 3.12 ASIMD Integer Instructions 1331//--- 1332 1333// ASIMD absolute diff, D-form 1334// ASIMD absolute diff, Q-form 1335// ASIMD absolute diff accum, D-form 1336// ASIMD absolute diff accum, Q-form 1337// ASIMD absolute diff accum long 1338// ASIMD absolute diff long 1339// ASIMD arith, basic 1340// ASIMD arith, complex 1341// ASIMD compare 1342// ASIMD logical (AND, BIC, EOR) 1343// ASIMD max/min, basic 1344// ASIMD max/min, reduce, 4H/4S 1345// ASIMD max/min, reduce, 8B/8H 1346// ASIMD max/min, reduce, 16B 1347// ASIMD multiply, D-form 1348// ASIMD multiply, Q-form 1349// ASIMD multiply accumulate long 1350// ASIMD multiply accumulate saturating long 1351// ASIMD multiply long 1352// ASIMD pairwise add and accumulate 1353// ASIMD shift accumulate 1354// ASIMD shift by immed, basic 1355// ASIMD shift by immed and insert, basic, D-form 1356// ASIMD shift by immed and insert, basic, Q-form 1357// ASIMD shift by immed, complex 1358// ASIMD shift by register, basic, D-form 1359// ASIMD shift by register, basic, Q-form 1360// ASIMD shift by register, complex, D-form 1361// ASIMD shift by register, complex, Q-form 1362def : WriteRes<WriteVd, [THX3T110FP0123]> { 1363 let Latency = 5; 1364 let NumMicroOps = 4; 1365 let ResourceCycles = [4]; 1366} 1367def : WriteRes<WriteVq, [THX3T110FP0123]> { 1368 let Latency = 5; 1369 let NumMicroOps = 4; 1370 let ResourceCycles = [4]; 1371} 1372 1373// ASIMD arith, reduce, 4H/4S 1374// ASIMD arith, reduce, 8B/8H 1375// ASIMD arith, reduce, 16B 1376 1377// ASIMD logical (MVN (alias for NOT), ORN, ORR) 1378def : InstRW<[THX3T110Write_5Cyc_F0123], 1379 (instregex "^ANDv", "^BICv", "^EORv", "^ORRv", "^ORNv", "^NOTv")>; 1380 1381// ASIMD arith, reduce 1382def : InstRW<[THX3T110Write_5Cyc_F0123], 1383 (instregex "^ADDVv", "^SADDLVv", "^UADDLVv")>; 1384 1385// ASIMD polynomial (8x8) multiply long 1386def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^(S|U|SQD)MULL")>; 1387def : InstRW<[THX3T110Write_5Cyc_F0123], 1388 (instregex "(S|U|SQD)(MLAL|MLSL|MULL)v.*")>; 1389def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^PMULL(v8i8|v16i8)")>; 1390def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^PMULL(v1i64|v2i64)")>; 1391 1392// ASIMD absolute diff accum, D-form 1393def : InstRW<[THX3T110Write_5Cyc_F0123], 1394 (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>; 1395// ASIMD absolute diff accum, Q-form 1396def : InstRW<[THX3T110Write_5Cyc_F0123], 1397 (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>; 1398// ASIMD absolute diff accum long 1399def : InstRW<[THX3T110Write_5Cyc_F0123], 1400 (instregex "^[SU]ABAL")>; 1401// ASIMD arith, reduce, 4H/4S 1402def : InstRW<[THX3T110Write_5Cyc_F0123], 1403 (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>; 1404// ASIMD arith, reduce, 8B 1405def : InstRW<[THX3T110Write_5Cyc_F0123], 1406 (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>; 1407// ASIMD arith, reduce, 16B/16H 1408def : InstRW<[THX3T110Write_10Cyc_F0123], 1409 (instregex "^[SU]?ADDL?Vv16i8v$")>; 1410// ASIMD max/min, reduce, 4H/4S 1411def : InstRW<[THX3T110Write_5Cyc_F0123], 1412 (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>; 1413// ASIMD max/min, reduce, 8B/8H 1414def : InstRW<[THX3T110Write_5Cyc_F0123], 1415 (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>; 1416// ASIMD max/min, reduce, 16B/16H 1417def : InstRW<[THX3T110Write_5Cyc_F0123], 1418 (instregex "^[SU](MIN|MAX)Vv16i8v$")>; 1419// ASIMD multiply, D-form 1420def : InstRW<[THX3T110Write_5Cyc_F0123], 1421 (instregex "^(P?MUL|SQR?DMULH)" # 1422 "(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)" # 1423 "(_indexed)?$")>; 1424// ASIMD multiply, Q-form 1425def : InstRW<[THX3T110Write_5Cyc_F0123], 1426 (instregex "^(P?MUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>; 1427// ASIMD multiply accumulate, D-form 1428def : InstRW<[THX3T110Write_5Cyc_F0123], 1429 (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>; 1430// ASIMD multiply accumulate, Q-form 1431def : InstRW<[THX3T110Write_5Cyc_F0123], 1432 (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>; 1433// ASIMD shift accumulate 1434def : InstRW<[THX3T110Write_5Cyc_F0123], 1435 (instregex "SRSRAv","SSRAv","URSRAv","USRAv")>; 1436 1437// ASIMD shift by immed, basic 1438def : InstRW<[THX3T110Write_5Cyc_F0123], 1439 (instregex "RSHRNv","SHRNv", "SQRSHRNv","SQRSHRUNv", 1440 "SQSHRNv","SQSHRUNv", "UQRSHRNv", 1441 "UQSHRNv","SQXTNv","SQXTUNv","UQXTNv")>; 1442// ASIMD shift by immed, complex 1443def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]?(Q|R){1,2}SHR")>; 1444def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SQSHLU")>; 1445// ASIMD shift by register, basic, Q-form 1446def : InstRW<[THX3T110Write_5Cyc_F01], 1447 (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>; 1448// ASIMD shift by register, complex, D-form 1449def : InstRW<[THX3T110Write_5Cyc_F0123], 1450 (instregex "^[SU][QR]{1,2}SHL" # 1451 "(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>; 1452// ASIMD shift by register, complex, Q-form 1453def : InstRW<[THX3T110Write_5Cyc_F0123], 1454 (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>; 1455 1456// ASIMD Arithmetic 1457def : InstRW<[THX3T110Write_5Cyc_F0123], 1458 (instregex "(ADD|SUB)(v8i8|v4i16|v2i32|v1i64)")>; 1459def : InstRW<[THX3T110Write_5Cyc_F0123], 1460 (instregex "(ADD|SUB)(v16i8|v8i16|v4i32|v2i64)")>; 1461def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(ADD|SUB)HNv.*")>; 1462def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(RADD|RSUB)HNv.*")>; 1463def : InstRW<[THX3T110Write_5Cyc_F0123], 1464 (instregex "^SQADD", "^SQNEG", "^SQSUB", "^SRHADD", 1465 "^SUQADD", "^UQADD", "^UQSUB", "^URHADD", "^USQADD")>; 1466def : InstRW<[THX3T110Write_5Cyc_F0123], 1467 (instregex "ADDP(v16i8|v8i16|v4i32|v2i64)")>; 1468def : InstRW<[THX3T110Write_5Cyc_F0123], 1469 (instregex "((AND|ORN|EOR|EON)S?(Xr[rsi]|v16i8|v8i16|v4i32)|" # 1470 "(ORR|BIC)S?(Xr[rs]|v16i8|v8i16|v4i32))")>; 1471def : InstRW<[THX3T110Write_5Cyc_F0123], 1472 (instregex "(CLS|CLZ|CNT)(v4i32|v8i16|v16i8)")>; 1473def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADALP","^UADALP")>; 1474def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADDLPv","^UADDLPv")>; 1475def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADDLV","^UADDLV")>; 1476def : InstRW<[THX3T110Write_5Cyc_F0123], 1477 (instregex "^ADDVv","^SMAXVv","^UMAXVv","^SMINVv","^UMINVv")>; 1478def : InstRW<[THX3T110Write_5Cyc_F0123], 1479 (instregex "^SABAv","^UABAv","^SABALv","^UABALv")>; 1480def : InstRW<[THX3T110Write_5Cyc_F0123], 1481 (instregex "^SQADDv","^SQSUBv","^UQADDv","^UQSUBv")>; 1482def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SUQADDv","^USQADDv")>; 1483def : InstRW<[THX3T110Write_5Cyc_F0123], 1484 (instregex "^ADDHNv","^RADDHNv", "^RSUBHNv", 1485 "^SQABS", "^SQADD", "^SQNEG", "^SQSUB", 1486 "^SRHADD", "^SUBHNv", "^SUQADD", 1487 "^UQADD", "^UQSUB", "^URHADD", "^USQADD")>; 1488def : InstRW<[THX3T110Write_5Cyc_F0123], 1489 (instregex "^CMEQv","^CMGEv","^CMGTv", 1490 "^CMLEv","^CMLTv", "^CMHIv","^CMHSv")>; 1491def : InstRW<[THX3T110Write_5Cyc_F0123], 1492 (instregex "^SMAXv","^SMINv","^UMAXv","^UMINv", 1493 "^SMAXPv","^SMINPv","^UMAXPv","^UMINPv")>; 1494def : InstRW<[THX3T110Write_5Cyc_F0123], 1495 (instregex "^SABDv","^UABDv", "^SABDLv","^UABDLv")>; 1496 1497//--- 1498// 3.13 ASIMD Floating-point Instructions 1499//--- 1500 1501// ASIMD FP absolute value 1502def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FABSv")>; 1503 1504// ASIMD FP arith, normal, D-form 1505// ASIMD FP arith, normal, Q-form 1506def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], 1507 (instregex "^FABDv", "^FADDv", "^FSUBv")>; 1508 1509// ASIMD FP arith,pairwise, D-form 1510// ASIMD FP arith, pairwise, Q-form 1511def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FADDPv")>; 1512 1513// ASIMD FP compare, D-form 1514// ASIMD FP compare, Q-form 1515def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FACGEv", "^FACGTv")>; 1516def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FCMEQv", "^FCMGEv", 1517 "^FCMGTv", "^FCMLEv", 1518 "^FCMLTv")>; 1519 1520// ASIMD FP round, D-form 1521def : InstRW<[THX3T110Write_5Cyc_F0123], 1522 (instregex "^FRINT[AIMNPXZ](v2f32)")>; 1523// ASIMD FP round, Q-form 1524def : InstRW<[THX3T110Write_5Cyc_F0123], 1525 (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>; 1526 1527// ASIMD FP convert, long 1528// ASIMD FP convert, narrow 1529// ASIMD FP convert, other, D-form 1530// ASIMD FP convert, other, Q-form 1531// NOTE: Handled by WriteV. 1532 1533// ASIMD FP convert, long and narrow 1534def : InstRW<[THX3T110Write_5Cyc_F01], (instregex "^FCVT(L|N|XN)v")>; 1535// ASIMD FP convert, other, D-form 1536def : InstRW<[THX3T110Write_5Cyc_F01], 1537 (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>; 1538// ASIMD FP convert, other, Q-form 1539def : InstRW<[THX3T110Write_5Cyc_F01], 1540 (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>; 1541 1542// ASIMD FP divide, D-form, F32 1543def : InstRW<[THX3T110Write_16Cyc_F0123], (instrs FDIVv2f32)>; 1544def : InstRW<[THX3T110Write_16Cyc_F0123], (instregex "FDIVv2f32")>; 1545 1546// ASIMD FP divide, Q-form, F32 1547def : InstRW<[THX3T110Write_16Cyc_F0123], (instrs FDIVv4f32)>; 1548def : InstRW<[THX3T110Write_16Cyc_F0123], (instregex "FDIVv4f32")>; 1549 1550// ASIMD FP divide, Q-form, F64 1551def : InstRW<[THX3T110Write_23Cyc_F0123], (instrs FDIVv2f64)>; 1552def : InstRW<[THX3T110Write_23Cyc_F0123], (instregex "FDIVv2f64")>; 1553 1554// ASIMD FP max/min, normal, D-form 1555// ASIMD FP max/min, normal, Q-form 1556def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXv", "^FMAXNMv", 1557 "^FMINv", "^FMINNMv")>; 1558 1559// ASIMD FP max/min, pairwise, D-form 1560// ASIMD FP max/min, pairwise, Q-form 1561def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXPv", "^FMAXNMPv", 1562 "^FMINPv", "^FMINNMPv")>; 1563 1564// ASIMD FP max/min, reduce 1565def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXVv", "^FMAXNMVv", 1566 "^FMINVv", "^FMINNMVv")>; 1567 1568// ASIMD FP multiply, D-form, FZ 1569// ASIMD FP multiply, D-form, no FZ 1570// ASIMD FP multiply, Q-form, FZ 1571// ASIMD FP multiply, Q-form, no FZ 1572def : InstRW<[THX3T110Write_5Cyc_F0123], 1573 (instregex "^FMULv", "^FMULXv")>; 1574def : InstRW<[THX3T110Write_5Cyc_F0123], 1575 (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>; 1576def : InstRW<[THX3T110Write_5Cyc_F0123], 1577 (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>; 1578 1579// ASIMD FP multiply accumulate, Dform, FZ 1580// ASIMD FP multiply accumulate, Dform, no FZ 1581// ASIMD FP multiply accumulate, Qform, FZ 1582// ASIMD FP multiply accumulate, Qform, no FZ 1583def : InstRW<[THX3T110Write_5Cyc_F0123], 1584 (instregex "^FMLAv", "^FMLSv")>; 1585def : InstRW<[THX3T110Write_5Cyc_F0123], 1586 (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>; 1587def : InstRW<[THX3T110Write_5Cyc_F0123], 1588 (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>; 1589 1590// ASIMD FP negate 1591def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FNEGv")>; 1592 1593//-- 1594// 3.14 ASIMD Miscellaneous Instructions 1595//-- 1596 1597// ASIMD bit reverse 1598def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^RBITv")>; 1599 1600// ASIMD bitwise insert, D-form 1601// ASIMD bitwise insert, Q-form 1602def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], 1603 (instregex "^BIFv", "^BITv", "^BSLv")>; 1604 1605// ASIMD count, D-form 1606// ASIMD count, Q-form 1607def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], 1608 (instregex "^CLSv", "^CLZv", "^CNTv")>; 1609 1610// ASIMD duplicate, gen reg 1611// ASIMD duplicate, element 1612def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUPv")>; 1613def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUP(i8|i16|i32|i64)$")>; 1614def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUPv.+gpr")>; 1615 1616// ASIMD extract 1617def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^EXTv")>; 1618 1619// ASIMD extract narrow 1620def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^XTNv")>; 1621 1622// ASIMD extract narrow, saturating 1623def : InstRW<[THX3T110Write_5Cyc_F0123], 1624 (instregex "^SQXTNv", "^SQXTUNv", "^UQXTNv")>; 1625 1626// ASIMD insert, element to element 1627def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^INSv")>; 1628 1629// ASIMD transfer, element to gen reg 1630def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]MOVv")>; 1631 1632// ASIMD move, integer immed 1633def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^MOVIv")>; 1634 1635// ASIMD move, FP immed 1636def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FMOVv")>; 1637 1638// ASIMD transpose 1639def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^TRN1", "^TRN2")>; 1640 1641// ASIMD unzip/zip 1642def : InstRW<[THX3T110Write_5Cyc_F0123], 1643 (instregex "^UZP1", "^UZP2", "^ZIP1", "^ZIP2")>; 1644 1645// ASIMD reciprocal estimate, D-form 1646// ASIMD reciprocal estimate, Q-form 1647def : InstRW<[THX3T110Write_5Cyc_F0123], 1648 (instregex "^FRECPEv", "^FRECPXv", "^URECPEv", 1649 "^FRSQRTEv", "^URSQRTEv")>; 1650 1651// ASIMD reciprocal step, D-form, FZ 1652// ASIMD reciprocal step, D-form, no FZ 1653// ASIMD reciprocal step, Q-form, FZ 1654// ASIMD reciprocal step, Q-form, no FZ 1655def : InstRW<[THX3T110Write_5Cyc_F0123], 1656 (instregex "^FRECPSv", "^FRSQRTSv")>; 1657 1658// ASIMD reverse 1659def : InstRW<[THX3T110Write_5Cyc_F0123], 1660 (instregex "^REV16v", "^REV32v", "^REV64v")>; 1661 1662// ASIMD table lookup, D-form 1663// ASIMD table lookup, Q-form 1664def : InstRW<[THX3T110Write_5Cyc_F0123], 1665 (instrs TBLv8i8One, TBLv16i8One, TBXv8i8One, TBXv16i8One)>; 1666def : InstRW<[THX3T110Write_10Cyc_F0123], 1667 (instrs TBLv8i8Two, TBLv16i8Two, TBXv8i8Two, TBXv16i8Two)>; 1668def : InstRW<[THX3T110Write_15Cyc_F0123], 1669 (instrs TBLv8i8Three, TBLv16i8Three, TBXv8i8Three, TBXv16i8Three)>; 1670def : InstRW<[THX3T110Write_20Cyc_F0123], 1671 (instrs TBLv8i8Four, TBLv16i8Four, TBXv8i8Four, TBXv16i8Four)>; 1672 1673// ASIMD transfer, element to word or word 1674def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]MOVv")>; 1675 1676// ASIMD transfer, element to gen reg 1677def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(S|U)MOVv.*")>; 1678 1679// ASIMD transfer gen reg to element 1680def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^INSv")>; 1681 1682// ASIMD transpose 1683def : InstRW<[THX3T110Write_5Cyc_F0123], 1684 (instregex "^TRN1v", "^TRN2v", "^UZP1v", "^UZP2v")>; 1685 1686// ASIMD unzip/zip 1687def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^ZIP1v", "^ZIP2v")>; 1688 1689//-- 1690// 3.15 ASIMD Load Instructions 1691//-- 1692 1693// ASIMD load, 1 element, multiple, 1 reg, D-form 1694// ASIMD load, 1 element, multiple, 1 reg, Q-form 1695def : InstRW<[THX3T110Write_4Cyc_LS01], 1696 (instregex "^LD1Onev(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1697def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr], 1698 (instregex "^LD1Onev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1699 1700// ASIMD load, 1 element, multiple, 2 reg, D-form 1701// ASIMD load, 1 element, multiple, 2 reg, Q-form 1702def : InstRW<[THX3T110Write_4Cyc_LS01], 1703 (instregex "^LD1Twov(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1704def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr], 1705 (instregex "^LD1Twov(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1706 1707// ASIMD load, 1 element, multiple, 3 reg, D-form 1708// ASIMD load, 1 element, multiple, 3 reg, Q-form 1709def : InstRW<[THX3T110Write_5Cyc_LS01], 1710 (instregex "^LD1Threev(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1711def : InstRW<[THX3T110Write_5Cyc_LS01, WriteAdr], 1712 (instregex "^LD1Threev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1713 1714// ASIMD load, 1 element, multiple, 4 reg, D-form 1715// ASIMD load, 1 element, multiple, 4 reg, Q-form 1716def : InstRW<[THX3T110Write_6Cyc_LS01], 1717 (instregex "^LD1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1718def : InstRW<[THX3T110Write_6Cyc_LS01, WriteAdr], 1719 (instregex "^LD1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1720 1721// ASIMD load, 1 element, one lane, B/H/S 1722// ASIMD load, 1 element, one lane, D 1723def : InstRW<[THX3T110Write_5Cyc_LS01_F0123], 1724 (instregex "^LD1i(8|16|32|64)$")>; 1725def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr], 1726 (instregex "^LD1i(8|16|32|64)_POST$")>; 1727 1728// ASIMD load, 1 element, all lanes, D-form, B/H/S 1729// ASIMD load, 1 element, all lanes, D-form, D 1730// ASIMD load, 1 element, all lanes, Q-form 1731def : InstRW<[THX3T110Write_5Cyc_LS01_F0123], 1732 (instregex "^LD1Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1733def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr], 1734 (instregex "^LD1Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1735 1736// ASIMD load, 2 element, multiple, D-form, B/H/S 1737// ASIMD load, 2 element, multiple, Q-form, D 1738def : InstRW<[THX3T110Write_5Cyc_LS01_F0123], 1739 (instregex "^LD2Twov(8b|4h|2s|16b|8h|4s|2d)$")>; 1740def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr], 1741 (instregex "^LD2Twov(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1742 1743// ASIMD load, 2 element, one lane, B/H 1744// ASIMD load, 2 element, one lane, S 1745// ASIMD load, 2 element, one lane, D 1746def : InstRW<[THX3T110Write_5Cyc_LS01_F0123], 1747 (instregex "^LD2i(8|16|32|64)$")>; 1748def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr], 1749 (instregex "^LD2i(8|16|32|64)_POST$")>; 1750 1751// ASIMD load, 2 element, all lanes, D-form, B/H/S 1752// ASIMD load, 2 element, all lanes, D-form, D 1753// ASIMD load, 2 element, all lanes, Q-form 1754def : InstRW<[THX3T110Write_5Cyc_LS01_F0123], 1755 (instregex "^LD2Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1756def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr], 1757 (instregex "^LD2Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1758 1759// ASIMD load, 3 element, multiple, D-form, B/H/S 1760// ASIMD load, 3 element, multiple, Q-form, B/H/S 1761// ASIMD load, 3 element, multiple, Q-form, D 1762def : InstRW<[THX3T110Write_8Cyc_LS01_F0123], 1763 (instregex "^LD3Threev(8b|4h|2s|16b|8h|4s|2d)$")>; 1764def : InstRW<[THX3T110Write_8Cyc_LS01_F0123, WriteAdr], 1765 (instregex "^LD3Threev(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1766 1767// ASIMD load, 3 element, one lone, B/H 1768// ASIMD load, 3 element, one lane, S 1769// ASIMD load, 3 element, one lane, D 1770def : InstRW<[THX3T110Write_7Cyc_LS01_F0123], 1771 (instregex "^LD3i(8|16|32|64)$")>; 1772def : InstRW<[THX3T110Write_7Cyc_LS01_F0123, WriteAdr], 1773 (instregex "^LD3i(8|16|32|64)_POST$")>; 1774 1775// ASIMD load, 3 element, all lanes, D-form, B/H/S 1776// ASIMD load, 3 element, all lanes, D-form, D 1777// ASIMD load, 3 element, all lanes, Q-form, B/H/S 1778// ASIMD load, 3 element, all lanes, Q-form, D 1779def : InstRW<[THX3T110Write_7Cyc_LS01_F0123], 1780 (instregex "^LD3Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1781def : InstRW<[THX3T110Write_7Cyc_LS01_F0123, WriteAdr], 1782 (instregex "^LD3Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1783 1784// ASIMD load, 4 element, multiple, D-form, B/H/S 1785// ASIMD load, 4 element, multiple, Q-form, B/H/S 1786// ASIMD load, 4 element, multiple, Q-form, D 1787def : InstRW<[THX3T110Write_8Cyc_LS01_F0123], 1788 (instregex "^LD4Fourv(8b|4h|2s|16b|8h|4s|2d)$")>; 1789def : InstRW<[THX3T110Write_8Cyc_LS01_F0123, WriteAdr], 1790 (instregex "^LD4Fourv(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1791 1792// ASIMD load, 4 element, one lane, B/H 1793// ASIMD load, 4 element, one lane, S 1794// ASIMD load, 4 element, one lane, D 1795def : InstRW<[THX3T110Write_6Cyc_LS01_F0123], 1796 (instregex "^LD4i(8|16|32|64)$")>; 1797def : InstRW<[THX3T110Write_6Cyc_LS01_F0123, WriteAdr], 1798 (instregex "^LD4i(8|16|32|64)_POST$")>; 1799 1800// ASIMD load, 4 element, all lanes, D-form, B/H/S 1801// ASIMD load, 4 element, all lanes, D-form, D 1802// ASIMD load, 4 element, all lanes, Q-form, B/H/S 1803// ASIMD load, 4 element, all lanes, Q-form, D 1804def : InstRW<[THX3T110Write_6Cyc_LS01_F0123], 1805 (instregex "^LD4Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1806def : InstRW<[THX3T110Write_6Cyc_LS01_F0123, WriteAdr], 1807 (instregex "^LD4Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1808 1809//-- 1810// 3.16 ASIMD Store Instructions 1811//-- 1812 1813// ASIMD store, 1 element, multiple, 1 reg, D-form 1814// ASIMD store, 1 element, multiple, 1 reg, Q-form 1815def : InstRW<[THX3T110Write_1Cyc_LS01], 1816 (instregex "^ST1Onev(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1817def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr], 1818 (instregex "^ST1Onev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1819 1820// ASIMD store, 1 element, multiple, 2 reg, D-form 1821// ASIMD store, 1 element, multiple, 2 reg, Q-form 1822def : InstRW<[THX3T110Write_1Cyc_LS01], 1823 (instregex "^ST1Twov(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1824def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr], 1825 (instregex "^ST1Twov(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1826 1827// ASIMD store, 1 element, multiple, 3 reg, D-form 1828// ASIMD store, 1 element, multiple, 3 reg, Q-form 1829def : InstRW<[THX3T110Write_1Cyc_LS01], 1830 (instregex "^ST1Threev(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1831def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr], 1832 (instregex "^ST1Threev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1833 1834// ASIMD store, 1 element, multiple, 4 reg, D-form 1835// ASIMD store, 1 element, multiple, 4 reg, Q-form 1836def : InstRW<[THX3T110Write_1Cyc_LS01], 1837 (instregex "^ST1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)$")>; 1838def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr], 1839 (instregex "^ST1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>; 1840 1841// ASIMD store, 1 element, one lane, B/H/S 1842// ASIMD store, 1 element, one lane, D 1843def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1844 (instregex "^ST1i(8|16|32|64)$")>; 1845def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1846 (instregex "^ST1i(8|16|32|64)_POST$")>; 1847 1848// ASIMD store, 2 element, multiple, D-form, B/H/S 1849// ASIMD store, 2 element, multiple, Q-form, B/H/S 1850// ASIMD store, 2 element, multiple, Q-form, D 1851def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1852 (instregex "^ST2Twov(8b|4h|2s|16b|8h|4s|2d)$")>; 1853def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1854 (instregex "^ST2Twov(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1855 1856// ASIMD store, 2 element, one lane, B/H/S 1857// ASIMD store, 2 element, one lane, D 1858def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1859 (instregex "^ST2i(8|16|32|64)$")>; 1860def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1861 (instregex "^ST2i(8|16|32|64)_POST$")>; 1862 1863// ASIMD store, 3 element, multiple, D-form, B/H/S 1864// ASIMD store, 3 element, multiple, Q-form, B/H/S 1865// ASIMD store, 3 element, multiple, Q-form, D 1866def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1867 (instregex "^ST3Threev(8b|4h|2s|16b|8h|4s|2d)$")>; 1868def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1869 (instregex "^ST3Threev(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1870 1871// ASIMD store, 3 element, one lane, B/H 1872// ASIMD store, 3 element, one lane, S 1873// ASIMD store, 3 element, one lane, D 1874def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1875 (instregex "^ST3i(8|16|32|64)$")>; 1876def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1877 (instregex "^ST3i(8|16|32|64)_POST$")>; 1878 1879// ASIMD store, 4 element, multiple, D-form, B/H/S 1880// ASIMD store, 4 element, multiple, Q-form, B/H/S 1881// ASIMD store, 4 element, multiple, Q-form, D 1882def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1883 (instregex "^ST4Fourv(8b|4h|2s|16b|8h|4s|2d)$")>; 1884def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1885 (instregex "^ST4Fourv(8b|4h|2s|16b|8h|4s|2d)_POST$")>; 1886 1887// ASIMD store, 4 element, one lane, B/H 1888// ASIMD store, 4 element, one lane, S 1889// ASIMD store, 4 element, one lane, D 1890def : InstRW<[THX3T110Write_1Cyc_LS01_F0123], 1891 (instregex "^ST4i(8|16|32|64)$")>; 1892def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr], 1893 (instregex "^ST4i(8|16|32|64)_POST$")>; 1894 1895// V8.1a Atomics (LSE) 1896def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1897 (instrs CASB, CASH, CASW, CASX)>; 1898 1899def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1900 (instrs CASAB, CASAH, CASAW, CASAX)>; 1901 1902def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1903 (instrs CASLB, CASLH, CASLW, CASLX)>; 1904 1905def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1906 (instrs CASALB, CASALH, CASALW, CASALX)>; 1907 1908def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1909 (instrs LDLARB, LDLARH, LDLARW, LDLARX)>; 1910 1911def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1912 (instrs LDADDB, LDADDH, LDADDW, LDADDX)>; 1913 1914def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1915 (instrs LDADDAB, LDADDAH, LDADDAW, LDADDAX)>; 1916 1917def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1918 (instrs LDADDLB, LDADDLH, LDADDLW, LDADDLX)>; 1919 1920def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1921 (instrs LDADDALB, LDADDALH, LDADDALW, LDADDALX)>; 1922 1923def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1924 (instrs LDCLRB, LDCLRH, LDCLRW, LDCLRX)>; 1925 1926def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1927 (instrs LDCLRAB, LDCLRAH, LDCLRAW, LDCLRAX)>; 1928 1929def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1930 (instrs LDCLRLB, LDCLRLH, LDCLRLW, LDCLRLX)>; 1931 1932def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1933 (instrs LDCLRALB, LDCLRALH, LDCLRALW, LDCLRALX)>; 1934 1935def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1936 (instrs LDEORB, LDEORH, LDEORW, LDEORX)>; 1937 1938def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1939 (instrs LDEORAB, LDEORAH, LDEORAW, LDEORAX)>; 1940 1941def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1942 (instrs LDEORLB, LDEORLH, LDEORLW, LDEORLX)>; 1943 1944def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1945 (instrs LDEORALB, LDEORALH, LDEORALW, LDEORALX)>; 1946 1947def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1948 (instrs LDSETB, LDSETH, LDSETW, LDSETX)>; 1949 1950def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1951 (instrs LDSETAB, LDSETAH, LDSETAW, LDSETAX)>; 1952 1953def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1954 (instrs LDSETLB, LDSETLH, LDSETLW, LDSETLX)>; 1955 1956def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1957 (instrs LDSETALB, LDSETALH, LDSETALW, LDSETALX)>; 1958 1959def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1960 (instrs LDSMAXB, LDSMAXH, LDSMAXW, LDSMAXX, 1961 LDSMAXAB, LDSMAXAH, LDSMAXAW, LDSMAXAX, 1962 LDSMAXLB, LDSMAXLH, LDSMAXLW, LDSMAXLX, 1963 LDSMAXALB, LDSMAXALH, LDSMAXALW, LDSMAXALX)>; 1964 1965def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1966 (instrs LDSMINB, LDSMINH, LDSMINW, LDSMINX, 1967 LDSMINAB, LDSMINAH, LDSMINAW, LDSMINAX, 1968 LDSMINLB, LDSMINLH, LDSMINLW, LDSMINLX, 1969 LDSMINALB, LDSMINALH, LDSMINALW, LDSMINALX)>; 1970 1971def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1972 (instrs LDUMAXB, LDUMAXH, LDUMAXW, LDUMAXX, 1973 LDUMAXAB, LDUMAXAH, LDUMAXAW, LDUMAXAX, 1974 LDUMAXLB, LDUMAXLH, LDUMAXLW, LDUMAXLX, 1975 LDUMAXALB, LDUMAXALH, LDUMAXALW, LDUMAXALX)>; 1976 1977def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1978 (instrs LDUMINB, LDUMINH, LDUMINW, LDUMINX, 1979 LDUMINAB, LDUMINAH, LDUMINAW, LDUMINAX, 1980 LDUMINLB, LDUMINLH, LDUMINLW, LDUMINLX, 1981 LDUMINALB, LDUMINALH, LDUMINALW, LDUMINALX)>; 1982 1983def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1984 (instrs SWPB, SWPH, SWPW, SWPX)>; 1985 1986def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1987 (instrs SWPAB, SWPAH, SWPAW, SWPAX)>; 1988 1989def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic], 1990 (instrs SWPLB, SWPLH, SWPLW, SWPLX)>; 1991 1992def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic], 1993 (instrs SWPALB, SWPALH, SWPALW, SWPALX)>; 1994 1995def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic], 1996 (instrs STLLRB, STLLRH, STLLRW, STLLRX)>; 1997 1998// V8.3a PAC 1999def : InstRW<[THX3T110Write_11Cyc_LS01_I1], (instregex "^LDRAA", "^LDRAB")>; 2000def : InstRW<[THX3T110Write_8Cyc_I123], 2001 (instrs BLRAA, BLRAAZ, BLRAB, BLRABZ, 2002 BRAA, BRAAZ, BRAB, BRABZ)>; 2003def : InstRW<[THX3T110Write_8Cyc_I123], (instrs RETAA, RETAB)>; 2004 2005} // SchedModel = ThunderX3T110Model 2006