1 // SPDX-License-Identifier: GPL-2.0 2 /* 3 * This file contains instructions for testing by the test titled: 4 * 5 * "Test x86 instruction decoder - new instructions" 6 * 7 * Note that the 'Expecting' comment lines are consumed by the 8 * gen-insn-x86-dat.awk script and have the format: 9 * 10 * Expecting: <op> <branch> <rel> 11 * 12 * If this file is changed, remember to run the gen-insn-x86-dat.sh 13 * script and commit the result. 14 * 15 * Refer to insn-x86.c for more details. 16 */ 17 18 int main(void) 19 { 20 /* Following line is a marker for the awk script - do not change */ 21 asm volatile("rdtsc"); /* Start here */ 22 23 /* Test fix for vcvtph2ps in x86-opcode-map.txt */ 24 25 asm volatile("vcvtph2ps %xmm3,%ymm5"); 26 27 #ifdef __x86_64__ 28 29 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 30 31 asm volatile("cmovno %rax,%rbx"); 32 asm volatile("cmovno 0x12345678(%rax),%rcx"); 33 asm volatile("cmovno 0x12345678(%rax),%cx"); 34 35 asm volatile("cmove %rax,%rbx"); 36 asm volatile("cmove 0x12345678(%rax),%rcx"); 37 asm volatile("cmove 0x12345678(%rax),%cx"); 38 39 asm volatile("seto 0x12345678(%rax)"); 40 asm volatile("setno 0x12345678(%rax)"); 41 asm volatile("setb 0x12345678(%rax)"); 42 asm volatile("setc 0x12345678(%rax)"); 43 asm volatile("setnae 0x12345678(%rax)"); 44 asm volatile("setae 0x12345678(%rax)"); 45 asm volatile("setnb 0x12345678(%rax)"); 46 asm volatile("setnc 0x12345678(%rax)"); 47 asm volatile("sets 0x12345678(%rax)"); 48 asm volatile("setns 0x12345678(%rax)"); 49 50 /* AVX-512: Mask Instructions */ 51 52 asm volatile("kandw %k7,%k6,%k5"); 53 asm volatile("kandq %k7,%k6,%k5"); 54 asm volatile("kandb %k7,%k6,%k5"); 55 asm volatile("kandd %k7,%k6,%k5"); 56 57 asm volatile("kandnw %k7,%k6,%k5"); 58 asm volatile("kandnq %k7,%k6,%k5"); 59 asm volatile("kandnb %k7,%k6,%k5"); 60 asm volatile("kandnd %k7,%k6,%k5"); 61 62 asm volatile("knotw %k7,%k6"); 63 asm volatile("knotq %k7,%k6"); 64 asm volatile("knotb %k7,%k6"); 65 
asm volatile("knotd %k7,%k6"); 66 67 asm volatile("korw %k7,%k6,%k5"); 68 asm volatile("korq %k7,%k6,%k5"); 69 asm volatile("korb %k7,%k6,%k5"); 70 asm volatile("kord %k7,%k6,%k5"); 71 72 asm volatile("kxnorw %k7,%k6,%k5"); 73 asm volatile("kxnorq %k7,%k6,%k5"); 74 asm volatile("kxnorb %k7,%k6,%k5"); 75 asm volatile("kxnord %k7,%k6,%k5"); 76 77 asm volatile("kxorw %k7,%k6,%k5"); 78 asm volatile("kxorq %k7,%k6,%k5"); 79 asm volatile("kxorb %k7,%k6,%k5"); 80 asm volatile("kxord %k7,%k6,%k5"); 81 82 asm volatile("kaddw %k7,%k6,%k5"); 83 asm volatile("kaddq %k7,%k6,%k5"); 84 asm volatile("kaddb %k7,%k6,%k5"); 85 asm volatile("kaddd %k7,%k6,%k5"); 86 87 asm volatile("kunpckbw %k7,%k6,%k5"); 88 asm volatile("kunpckwd %k7,%k6,%k5"); 89 asm volatile("kunpckdq %k7,%k6,%k5"); 90 91 asm volatile("kmovw %k6,%k5"); 92 asm volatile("kmovw (%rcx),%k5"); 93 asm volatile("kmovw 0x123(%rax,%r14,8),%k5"); 94 asm volatile("kmovw %k5,(%rcx)"); 95 asm volatile("kmovw %k5,0x123(%rax,%r14,8)"); 96 asm volatile("kmovw %eax,%k5"); 97 asm volatile("kmovw %ebp,%k5"); 98 asm volatile("kmovw %r13d,%k5"); 99 asm volatile("kmovw %k5,%eax"); 100 asm volatile("kmovw %k5,%ebp"); 101 asm volatile("kmovw %k5,%r13d"); 102 103 asm volatile("kmovq %k6,%k5"); 104 asm volatile("kmovq (%rcx),%k5"); 105 asm volatile("kmovq 0x123(%rax,%r14,8),%k5"); 106 asm volatile("kmovq %k5,(%rcx)"); 107 asm volatile("kmovq %k5,0x123(%rax,%r14,8)"); 108 asm volatile("kmovq %rax,%k5"); 109 asm volatile("kmovq %rbp,%k5"); 110 asm volatile("kmovq %r13,%k5"); 111 asm volatile("kmovq %k5,%rax"); 112 asm volatile("kmovq %k5,%rbp"); 113 asm volatile("kmovq %k5,%r13"); 114 115 asm volatile("kmovb %k6,%k5"); 116 asm volatile("kmovb (%rcx),%k5"); 117 asm volatile("kmovb 0x123(%rax,%r14,8),%k5"); 118 asm volatile("kmovb %k5,(%rcx)"); 119 asm volatile("kmovb %k5,0x123(%rax,%r14,8)"); 120 asm volatile("kmovb %eax,%k5"); 121 asm volatile("kmovb %ebp,%k5"); 122 asm volatile("kmovb %r13d,%k5"); 123 asm volatile("kmovb %k5,%eax"); 124 asm 
volatile("kmovb %k5,%ebp"); 125 asm volatile("kmovb %k5,%r13d"); 126 127 asm volatile("kmovd %k6,%k5"); 128 asm volatile("kmovd (%rcx),%k5"); 129 asm volatile("kmovd 0x123(%rax,%r14,8),%k5"); 130 asm volatile("kmovd %k5,(%rcx)"); 131 asm volatile("kmovd %k5,0x123(%rax,%r14,8)"); 132 asm volatile("kmovd %eax,%k5"); 133 asm volatile("kmovd %ebp,%k5"); 134 asm volatile("kmovd %r13d,%k5"); 135 asm volatile("kmovd %k5,%eax"); 136 asm volatile("kmovd %k5,%ebp"); 137 asm volatile("kmovd %k5,%r13d"); 138 139 asm volatile("kortestw %k6,%k5"); 140 asm volatile("kortestq %k6,%k5"); 141 asm volatile("kortestb %k6,%k5"); 142 asm volatile("kortestd %k6,%k5"); 143 144 asm volatile("ktestw %k6,%k5"); 145 asm volatile("ktestq %k6,%k5"); 146 asm volatile("ktestb %k6,%k5"); 147 asm volatile("ktestd %k6,%k5"); 148 149 asm volatile("kshiftrw $0x12,%k6,%k5"); 150 asm volatile("kshiftrq $0x5b,%k6,%k5"); 151 asm volatile("kshiftlw $0x12,%k6,%k5"); 152 asm volatile("kshiftlq $0x5b,%k6,%k5"); 153 154 /* AVX-512: Op code 0f 5b */ 155 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 156 asm volatile("vcvtqq2ps %zmm29,%ymm6{%k7}"); 157 asm volatile("vcvtps2dq %xmm5,%xmm6"); 158 asm volatile("vcvttps2dq %xmm5,%xmm6"); 159 160 /* AVX-512: Op code 0f 6f */ 161 162 asm volatile("movq %mm0,%mm4"); 163 asm volatile("vmovdqa %ymm4,%ymm6"); 164 asm volatile("vmovdqa32 %zmm25,%zmm26"); 165 asm volatile("vmovdqa64 %zmm25,%zmm26"); 166 asm volatile("vmovdqu %ymm4,%ymm6"); 167 asm volatile("vmovdqu32 %zmm29,%zmm30"); 168 asm volatile("vmovdqu64 %zmm25,%zmm26"); 169 asm volatile("vmovdqu8 %zmm29,%zmm30"); 170 asm volatile("vmovdqu16 %zmm25,%zmm26"); 171 172 /* AVX-512: Op code 0f 78 */ 173 174 asm volatile("vmread %rax,%rbx"); 175 asm volatile("vcvttps2udq %zmm25,%zmm26"); 176 asm volatile("vcvttpd2udq %zmm29,%ymm6{%k7}"); 177 asm volatile("vcvttsd2usi %xmm6,%rax"); 178 asm volatile("vcvttss2usi %xmm6,%rax"); 179 asm volatile("vcvttps2uqq %ymm5,%zmm26{%k7}"); 180 asm volatile("vcvttpd2uqq %zmm29,%zmm30"); 181 182 /* 
AVX-512: Op code 0f 79 */ 183 184 asm volatile("vmwrite %rax,%rbx"); 185 asm volatile("vcvtps2udq %zmm25,%zmm26"); 186 asm volatile("vcvtpd2udq %zmm29,%ymm6{%k7}"); 187 asm volatile("vcvtsd2usi %xmm6,%rax"); 188 asm volatile("vcvtss2usi %xmm6,%rax"); 189 asm volatile("vcvtps2uqq %ymm5,%zmm26{%k7}"); 190 asm volatile("vcvtpd2uqq %zmm29,%zmm30"); 191 192 /* AVX-512: Op code 0f 7a */ 193 194 asm volatile("vcvtudq2pd %ymm5,%zmm29{%k7}"); 195 asm volatile("vcvtuqq2pd %zmm25,%zmm26"); 196 asm volatile("vcvtudq2ps %zmm29,%zmm30"); 197 asm volatile("vcvtuqq2ps %zmm25,%ymm26{%k7}"); 198 asm volatile("vcvttps2qq %ymm25,%zmm26{%k7}"); 199 asm volatile("vcvttpd2qq %zmm29,%zmm30"); 200 201 /* AVX-512: Op code 0f 7b */ 202 203 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 204 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 205 asm volatile("vcvtps2qq %ymm5,%zmm26{%k7}"); 206 asm volatile("vcvtpd2qq %zmm29,%zmm30"); 207 208 /* AVX-512: Op code 0f 7f */ 209 210 asm volatile("movq.s %mm0,%mm4"); 211 asm volatile("vmovdqa %ymm8,%ymm6"); 212 asm volatile("vmovdqa32.s %zmm25,%zmm26"); 213 asm volatile("vmovdqa64.s %zmm25,%zmm26"); 214 asm volatile("vmovdqu %ymm8,%ymm6"); 215 asm volatile("vmovdqu32.s %zmm25,%zmm26"); 216 asm volatile("vmovdqu64.s %zmm25,%zmm26"); 217 asm volatile("vmovdqu8.s %zmm30,(%rcx)"); 218 asm volatile("vmovdqu16.s %zmm25,%zmm26"); 219 220 /* AVX-512: Op code 0f db */ 221 222 asm volatile("pand %mm1,%mm2"); 223 asm volatile("pand %xmm1,%xmm2"); 224 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 225 asm volatile("vpandd %zmm24,%zmm25,%zmm26"); 226 asm volatile("vpandq %zmm24,%zmm25,%zmm26"); 227 228 /* AVX-512: Op code 0f df */ 229 230 asm volatile("pandn %mm1,%mm2"); 231 asm volatile("pandn %xmm1,%xmm2"); 232 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 233 asm volatile("vpandnd %zmm24,%zmm25,%zmm26"); 234 asm volatile("vpandnq %zmm24,%zmm25,%zmm26"); 235 236 /* AVX-512: Op code 0f e6 */ 237 238 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 239 asm volatile("vcvtdq2pd 
%xmm5,%xmm6"); 240 asm volatile("vcvtdq2pd %ymm5,%zmm26{%k7}"); 241 asm volatile("vcvtqq2pd %zmm25,%zmm26"); 242 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 243 244 /* AVX-512: Op code 0f eb */ 245 246 asm volatile("por %mm4,%mm6"); 247 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 248 asm volatile("vpord %zmm24,%zmm25,%zmm26"); 249 asm volatile("vporq %zmm24,%zmm25,%zmm26"); 250 251 /* AVX-512: Op code 0f ef */ 252 253 asm volatile("pxor %mm4,%mm6"); 254 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 255 asm volatile("vpxord %zmm24,%zmm25,%zmm26"); 256 asm volatile("vpxorq %zmm24,%zmm25,%zmm26"); 257 258 /* AVX-512: Op code 0f 38 10 */ 259 260 asm volatile("pblendvb %xmm1,%xmm0"); 261 asm volatile("vpsrlvw %zmm27,%zmm28,%zmm29"); 262 asm volatile("vpmovuswb %zmm28,%ymm6{%k7}"); 263 264 /* AVX-512: Op code 0f 38 11 */ 265 266 asm volatile("vpmovusdb %zmm28,%xmm6{%k7}"); 267 asm volatile("vpsravw %zmm27,%zmm28,%zmm29"); 268 269 /* AVX-512: Op code 0f 38 12 */ 270 271 asm volatile("vpmovusqb %zmm27,%xmm6{%k7}"); 272 asm volatile("vpsllvw %zmm27,%zmm28,%zmm29"); 273 274 /* AVX-512: Op code 0f 38 13 */ 275 276 asm volatile("vcvtph2ps %xmm3,%ymm5"); 277 asm volatile("vcvtph2ps %ymm5,%zmm27{%k7}"); 278 asm volatile("vpmovusdw %zmm27,%ymm6{%k7}"); 279 280 /* AVX-512: Op code 0f 38 14 */ 281 282 asm volatile("blendvps %xmm1,%xmm0"); 283 asm volatile("vpmovusqw %zmm27,%xmm6{%k7}"); 284 asm volatile("vprorvd %zmm27,%zmm28,%zmm29"); 285 asm volatile("vprorvq %zmm27,%zmm28,%zmm29"); 286 287 /* AVX-512: Op code 0f 38 15 */ 288 289 asm volatile("blendvpd %xmm1,%xmm0"); 290 asm volatile("vpmovusqd %zmm27,%ymm6{%k7}"); 291 asm volatile("vprolvd %zmm27,%zmm28,%zmm29"); 292 asm volatile("vprolvq %zmm27,%zmm28,%zmm29"); 293 294 /* AVX-512: Op code 0f 38 16 */ 295 296 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 297 asm volatile("vpermps %ymm24,%ymm26,%ymm22{%k7}"); 298 asm volatile("vpermpd %ymm24,%ymm26,%ymm22{%k7}"); 299 300 /* AVX-512: Op code 0f 38 19 */ 301 302 asm volatile("vbroadcastsd 
%xmm4,%ymm6"); 303 asm volatile("vbroadcastf32x2 %xmm27,%zmm26"); 304 305 /* AVX-512: Op code 0f 38 1a */ 306 307 asm volatile("vbroadcastf128 (%rcx),%ymm4"); 308 asm volatile("vbroadcastf32x4 (%rcx),%zmm26"); 309 asm volatile("vbroadcastf64x2 (%rcx),%zmm26"); 310 311 /* AVX-512: Op code 0f 38 1b */ 312 313 asm volatile("vbroadcastf32x8 (%rcx),%zmm27"); 314 asm volatile("vbroadcastf64x4 (%rcx),%zmm26"); 315 316 /* AVX-512: Op code 0f 38 1f */ 317 318 asm volatile("vpabsq %zmm27,%zmm28"); 319 320 /* AVX-512: Op code 0f 38 20 */ 321 322 asm volatile("vpmovsxbw %xmm4,%xmm5"); 323 asm volatile("vpmovswb %zmm27,%ymm6{%k7}"); 324 325 /* AVX-512: Op code 0f 38 21 */ 326 327 asm volatile("vpmovsxbd %xmm4,%ymm6"); 328 asm volatile("vpmovsdb %zmm27,%xmm6{%k7}"); 329 330 /* AVX-512: Op code 0f 38 22 */ 331 332 asm volatile("vpmovsxbq %xmm4,%ymm4"); 333 asm volatile("vpmovsqb %zmm27,%xmm6{%k7}"); 334 335 /* AVX-512: Op code 0f 38 23 */ 336 337 asm volatile("vpmovsxwd %xmm4,%ymm4"); 338 asm volatile("vpmovsdw %zmm27,%ymm6{%k7}"); 339 340 /* AVX-512: Op code 0f 38 24 */ 341 342 asm volatile("vpmovsxwq %xmm4,%ymm6"); 343 asm volatile("vpmovsqw %zmm27,%xmm6{%k7}"); 344 345 /* AVX-512: Op code 0f 38 25 */ 346 347 asm volatile("vpmovsxdq %xmm4,%ymm4"); 348 asm volatile("vpmovsqd %zmm27,%ymm6{%k7}"); 349 350 /* AVX-512: Op code 0f 38 26 */ 351 352 asm volatile("vptestmb %zmm27,%zmm28,%k5"); 353 asm volatile("vptestmw %zmm27,%zmm28,%k5"); 354 asm volatile("vptestnmb %zmm26,%zmm27,%k5"); 355 asm volatile("vptestnmw %zmm26,%zmm27,%k5"); 356 357 /* AVX-512: Op code 0f 38 27 */ 358 359 asm volatile("vptestmd %zmm27,%zmm28,%k5"); 360 asm volatile("vptestmq %zmm27,%zmm28,%k5"); 361 asm volatile("vptestnmd %zmm26,%zmm27,%k5"); 362 asm volatile("vptestnmq %zmm26,%zmm27,%k5"); 363 364 /* AVX-512: Op code 0f 38 28 */ 365 366 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 367 asm volatile("vpmovm2b %k5,%zmm28"); 368 asm volatile("vpmovm2w %k5,%zmm28"); 369 370 /* AVX-512: Op code 0f 38 29 */ 371 372 
asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 373 asm volatile("vpmovb2m %zmm28,%k5"); 374 asm volatile("vpmovw2m %zmm28,%k5"); 375 376 /* AVX-512: Op code 0f 38 2a */ 377 378 asm volatile("vmovntdqa (%rcx),%ymm4"); 379 asm volatile("vpbroadcastmb2q %k6,%zmm30"); 380 381 /* AVX-512: Op code 0f 38 2c */ 382 383 asm volatile("vmaskmovps (%rcx),%ymm4,%ymm6"); 384 asm volatile("vscalefps %zmm24,%zmm25,%zmm26"); 385 asm volatile("vscalefpd %zmm24,%zmm25,%zmm26"); 386 387 /* AVX-512: Op code 0f 38 2d */ 388 389 asm volatile("vmaskmovpd (%rcx),%ymm4,%ymm6"); 390 asm volatile("vscalefss %xmm24,%xmm25,%xmm26{%k7}"); 391 asm volatile("vscalefsd %xmm24,%xmm25,%xmm26{%k7}"); 392 393 /* AVX-512: Op code 0f 38 30 */ 394 395 asm volatile("vpmovzxbw %xmm4,%ymm4"); 396 asm volatile("vpmovwb %zmm27,%ymm6{%k7}"); 397 398 /* AVX-512: Op code 0f 38 31 */ 399 400 asm volatile("vpmovzxbd %xmm4,%ymm6"); 401 asm volatile("vpmovdb %zmm27,%xmm6{%k7}"); 402 403 /* AVX-512: Op code 0f 38 32 */ 404 405 asm volatile("vpmovzxbq %xmm4,%ymm4"); 406 asm volatile("vpmovqb %zmm27,%xmm6{%k7}"); 407 408 /* AVX-512: Op code 0f 38 33 */ 409 410 asm volatile("vpmovzxwd %xmm4,%ymm4"); 411 asm volatile("vpmovdw %zmm27,%ymm6{%k7}"); 412 413 /* AVX-512: Op code 0f 38 34 */ 414 415 asm volatile("vpmovzxwq %xmm4,%ymm6"); 416 asm volatile("vpmovqw %zmm27,%xmm6{%k7}"); 417 418 /* AVX-512: Op code 0f 38 35 */ 419 420 asm volatile("vpmovzxdq %xmm4,%ymm4"); 421 asm volatile("vpmovqd %zmm27,%ymm6{%k7}"); 422 423 /* AVX-512: Op code 0f 38 36 */ 424 425 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 426 asm volatile("vpermd %ymm24,%ymm26,%ymm22{%k7}"); 427 asm volatile("vpermq %ymm24,%ymm26,%ymm22{%k7}"); 428 429 /* AVX-512: Op code 0f 38 38 */ 430 431 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 432 asm volatile("vpmovm2d %k5,%zmm28"); 433 asm volatile("vpmovm2q %k5,%zmm28"); 434 435 /* AVX-512: Op code 0f 38 39 */ 436 437 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 438 asm volatile("vpminsd %zmm24,%zmm25,%zmm26"); 439 asm 
volatile("vpminsq %zmm24,%zmm25,%zmm26"); 440 asm volatile("vpmovd2m %zmm28,%k5"); 441 asm volatile("vpmovq2m %zmm28,%k5"); 442 443 /* AVX-512: Op code 0f 38 3a */ 444 445 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 446 asm volatile("vpbroadcastmw2d %k6,%zmm28"); 447 448 /* AVX-512: Op code 0f 38 3b */ 449 450 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 451 asm volatile("vpminud %zmm24,%zmm25,%zmm26"); 452 asm volatile("vpminuq %zmm24,%zmm25,%zmm26"); 453 454 /* AVX-512: Op code 0f 38 3d */ 455 456 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 457 asm volatile("vpmaxsd %zmm24,%zmm25,%zmm26"); 458 asm volatile("vpmaxsq %zmm24,%zmm25,%zmm26"); 459 460 /* AVX-512: Op code 0f 38 3f */ 461 462 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 463 asm volatile("vpmaxud %zmm24,%zmm25,%zmm26"); 464 asm volatile("vpmaxuq %zmm24,%zmm25,%zmm26"); 465 466 /* AVX-512: Op code 0f 38 40 */ 467 468 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 469 asm volatile("vpmulld %zmm24,%zmm25,%zmm26"); 470 asm volatile("vpmullq %zmm24,%zmm25,%zmm26"); 471 472 /* AVX-512: Op code 0f 38 42 */ 473 474 asm volatile("vgetexpps %zmm25,%zmm26"); 475 asm volatile("vgetexppd %zmm27,%zmm28"); 476 477 /* AVX-512: Op code 0f 38 43 */ 478 479 asm volatile("vgetexpss %xmm24,%xmm25,%xmm26{%k7}"); 480 asm volatile("vgetexpsd %xmm28,%xmm29,%xmm30{%k7}"); 481 482 /* AVX-512: Op code 0f 38 44 */ 483 484 asm volatile("vplzcntd %zmm27,%zmm28"); 485 asm volatile("vplzcntq %zmm27,%zmm28"); 486 487 /* AVX-512: Op code 0f 38 46 */ 488 489 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 490 asm volatile("vpsravd %zmm24,%zmm25,%zmm26"); 491 asm volatile("vpsravq %zmm24,%zmm25,%zmm26"); 492 493 /* AVX-512: Op code 0f 38 4c */ 494 495 asm volatile("vrcp14ps %zmm25,%zmm26"); 496 asm volatile("vrcp14pd %zmm27,%zmm28"); 497 498 /* AVX-512: Op code 0f 38 4d */ 499 500 asm volatile("vrcp14ss %xmm24,%xmm25,%xmm26{%k7}"); 501 asm volatile("vrcp14sd %xmm24,%xmm25,%xmm26{%k7}"); 502 503 /* AVX-512: Op code 0f 38 4e */ 504 505 asm 
volatile("vrsqrt14ps %zmm25,%zmm26"); 506 asm volatile("vrsqrt14pd %zmm27,%zmm28"); 507 508 /* AVX-512: Op code 0f 38 4f */ 509 510 asm volatile("vrsqrt14ss %xmm24,%xmm25,%xmm26{%k7}"); 511 asm volatile("vrsqrt14sd %xmm24,%xmm25,%xmm26{%k7}"); 512 513 /* AVX-512: Op code 0f 38 59 */ 514 515 asm volatile("vpbroadcastq %xmm4,%xmm6"); 516 asm volatile("vbroadcasti32x2 %xmm27,%zmm26"); 517 518 /* AVX-512: Op code 0f 38 5a */ 519 520 asm volatile("vbroadcasti128 (%rcx),%ymm4"); 521 asm volatile("vbroadcasti32x4 (%rcx),%zmm26"); 522 asm volatile("vbroadcasti64x2 (%rcx),%zmm26"); 523 524 /* AVX-512: Op code 0f 38 5b */ 525 526 asm volatile("vbroadcasti32x8 (%rcx),%zmm28"); 527 asm volatile("vbroadcasti64x4 (%rcx),%zmm26"); 528 529 /* AVX-512: Op code 0f 38 64 */ 530 531 asm volatile("vpblendmd %zmm26,%zmm27,%zmm28"); 532 asm volatile("vpblendmq %zmm26,%zmm27,%zmm28"); 533 534 /* AVX-512: Op code 0f 38 65 */ 535 536 asm volatile("vblendmps %zmm24,%zmm25,%zmm26"); 537 asm volatile("vblendmpd %zmm26,%zmm27,%zmm28"); 538 539 /* AVX-512: Op code 0f 38 66 */ 540 541 asm volatile("vpblendmb %zmm26,%zmm27,%zmm28"); 542 asm volatile("vpblendmw %zmm26,%zmm27,%zmm28"); 543 544 /* AVX-512: Op code 0f 38 75 */ 545 546 asm volatile("vpermi2b %zmm24,%zmm25,%zmm26"); 547 asm volatile("vpermi2w %zmm26,%zmm27,%zmm28"); 548 549 /* AVX-512: Op code 0f 38 76 */ 550 551 asm volatile("vpermi2d %zmm26,%zmm27,%zmm28"); 552 asm volatile("vpermi2q %zmm26,%zmm27,%zmm28"); 553 554 /* AVX-512: Op code 0f 38 77 */ 555 556 asm volatile("vpermi2ps %zmm26,%zmm27,%zmm28"); 557 asm volatile("vpermi2pd %zmm26,%zmm27,%zmm28"); 558 559 /* AVX-512: Op code 0f 38 7a */ 560 561 asm volatile("vpbroadcastb %eax,%xmm30"); 562 563 /* AVX-512: Op code 0f 38 7b */ 564 565 asm volatile("vpbroadcastw %eax,%xmm30"); 566 567 /* AVX-512: Op code 0f 38 7c */ 568 569 asm volatile("vpbroadcastd %eax,%xmm30"); 570 asm volatile("vpbroadcastq %rax,%zmm30"); 571 572 /* AVX-512: Op code 0f 38 7d */ 573 574 asm volatile("vpermt2b 
%zmm26,%zmm27,%zmm28"); 575 asm volatile("vpermt2w %zmm26,%zmm27,%zmm28"); 576 577 /* AVX-512: Op code 0f 38 7e */ 578 579 asm volatile("vpermt2d %zmm26,%zmm27,%zmm28"); 580 asm volatile("vpermt2q %zmm26,%zmm27,%zmm28"); 581 582 /* AVX-512: Op code 0f 38 7f */ 583 584 asm volatile("vpermt2ps %zmm26,%zmm27,%zmm28"); 585 asm volatile("vpermt2pd %zmm26,%zmm27,%zmm28"); 586 587 /* AVX-512: Op code 0f 38 83 */ 588 589 asm volatile("vpmultishiftqb %zmm26,%zmm27,%zmm28"); 590 591 /* AVX-512: Op code 0f 38 88 */ 592 593 asm volatile("vexpandps (%rcx),%zmm26"); 594 asm volatile("vexpandpd (%rcx),%zmm28"); 595 596 /* AVX-512: Op code 0f 38 89 */ 597 598 asm volatile("vpexpandd (%rcx),%zmm28"); 599 asm volatile("vpexpandq (%rcx),%zmm26"); 600 601 /* AVX-512: Op code 0f 38 8a */ 602 603 asm volatile("vcompressps %zmm28,(%rcx)"); 604 asm volatile("vcompresspd %zmm28,(%rcx)"); 605 606 /* AVX-512: Op code 0f 38 8b */ 607 608 asm volatile("vpcompressd %zmm28,(%rcx)"); 609 asm volatile("vpcompressq %zmm26,(%rcx)"); 610 611 /* AVX-512: Op code 0f 38 8d */ 612 613 asm volatile("vpermb %zmm26,%zmm27,%zmm28"); 614 asm volatile("vpermw %zmm26,%zmm27,%zmm28"); 615 616 /* AVX-512: Op code 0f 38 90 */ 617 618 asm volatile("vpgatherdd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 619 asm volatile("vpgatherdq %xmm2,0x04(%rbp,%xmm7,2),%xmm1"); 620 asm volatile("vpgatherdd 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 621 asm volatile("vpgatherdq 0x7b(%rbp,%ymm27,8),%zmm26{%k1}"); 622 623 /* AVX-512: Op code 0f 38 91 */ 624 625 asm volatile("vpgatherqd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 626 asm volatile("vpgatherqq %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 627 asm volatile("vpgatherqd 0x7b(%rbp,%zmm27,8),%ymm26{%k1}"); 628 asm volatile("vpgatherqq 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 629 630 /* AVX-512: Op code 0f 38 a0 */ 631 632 asm volatile("vpscatterdd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 633 asm volatile("vpscatterdq %zmm26,0x7b(%rbp,%ymm27,8){%k1}"); 634 635 /* AVX-512: Op code 0f 38 a1 */ 636 637 asm volatile("vpscatterqd 
%ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 638 asm volatile("vpscatterqq %ymm6,0x7b(%rbp,%ymm27,8){%k1}"); 639 640 /* AVX-512: Op code 0f 38 a2 */ 641 642 asm volatile("vscatterdps %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 643 asm volatile("vscatterdpd %zmm28,0x7b(%rbp,%ymm27,8){%k1}"); 644 645 /* AVX-512: Op code 0f 38 a3 */ 646 647 asm volatile("vscatterqps %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 648 asm volatile("vscatterqpd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 649 650 /* AVX-512: Op code 0f 38 b4 */ 651 652 asm volatile("vpmadd52luq %zmm26,%zmm27,%zmm28"); 653 654 /* AVX-512: Op code 0f 38 b5 */ 655 656 asm volatile("vpmadd52huq %zmm26,%zmm27,%zmm28"); 657 658 /* AVX-512: Op code 0f 38 c4 */ 659 660 asm volatile("vpconflictd %zmm26,%zmm27"); 661 asm volatile("vpconflictq %zmm26,%zmm27"); 662 663 /* AVX-512: Op code 0f 38 c8 */ 664 665 asm volatile("vexp2ps %zmm29,%zmm30"); 666 asm volatile("vexp2pd %zmm26,%zmm27"); 667 668 /* AVX-512: Op code 0f 38 ca */ 669 670 asm volatile("vrcp28ps %zmm29,%zmm30"); 671 asm volatile("vrcp28pd %zmm26,%zmm27"); 672 673 /* AVX-512: Op code 0f 38 cb */ 674 675 asm volatile("vrcp28ss %xmm28,%xmm29,%xmm30{%k7}"); 676 asm volatile("vrcp28sd %xmm25,%xmm26,%xmm27{%k7}"); 677 678 /* AVX-512: Op code 0f 38 cc */ 679 680 asm volatile("vrsqrt28ps %zmm29,%zmm30"); 681 asm volatile("vrsqrt28pd %zmm26,%zmm27"); 682 683 /* AVX-512: Op code 0f 38 cd */ 684 685 asm volatile("vrsqrt28ss %xmm28,%xmm29,%xmm30{%k7}"); 686 asm volatile("vrsqrt28sd %xmm25,%xmm26,%xmm27{%k7}"); 687 688 /* AVX-512: Op code 0f 3a 03 */ 689 690 asm volatile("valignd $0x12,%zmm28,%zmm29,%zmm30"); 691 asm volatile("valignq $0x12,%zmm25,%zmm26,%zmm27"); 692 693 /* AVX-512: Op code 0f 3a 08 */ 694 695 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 696 asm volatile("vrndscaleps $0x12,%zmm25,%zmm26"); 697 698 /* AVX-512: Op code 0f 3a 09 */ 699 700 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 701 asm volatile("vrndscalepd $0x12,%zmm25,%zmm26"); 702 703 /* AVX-512: Op code 0f 3a 0a */ 704 705 asm 
volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 706 asm volatile("vrndscaless $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 707 708 /* AVX-512: Op code 0f 3a 0b */ 709 710 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 711 asm volatile("vrndscalesd $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 712 713 /* AVX-512: Op code 0f 3a 18 */ 714 715 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 716 asm volatile("vinsertf32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 717 asm volatile("vinsertf64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 718 719 /* AVX-512: Op code 0f 3a 19 */ 720 721 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 722 asm volatile("vextractf32x4 $0x12,%zmm25,%xmm26{%k7}"); 723 asm volatile("vextractf64x2 $0x12,%zmm25,%xmm26{%k7}"); 724 725 /* AVX-512: Op code 0f 3a 1a */ 726 727 asm volatile("vinsertf32x8 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 728 asm volatile("vinsertf64x4 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 729 730 /* AVX-512: Op code 0f 3a 1b */ 731 732 asm volatile("vextractf32x8 $0x12,%zmm29,%ymm30{%k7}"); 733 asm volatile("vextractf64x4 $0x12,%zmm26,%ymm27{%k7}"); 734 735 /* AVX-512: Op code 0f 3a 1e */ 736 737 asm volatile("vpcmpud $0x12,%zmm29,%zmm30,%k5"); 738 asm volatile("vpcmpuq $0x12,%zmm26,%zmm27,%k5"); 739 740 /* AVX-512: Op code 0f 3a 1f */ 741 742 asm volatile("vpcmpd $0x12,%zmm29,%zmm30,%k5"); 743 asm volatile("vpcmpq $0x12,%zmm26,%zmm27,%k5"); 744 745 /* AVX-512: Op code 0f 3a 23 */ 746 747 asm volatile("vshuff32x4 $0x12,%zmm28,%zmm29,%zmm30"); 748 asm volatile("vshuff64x2 $0x12,%zmm25,%zmm26,%zmm27"); 749 750 /* AVX-512: Op code 0f 3a 25 */ 751 752 asm volatile("vpternlogd $0x12,%zmm28,%zmm29,%zmm30"); 753 asm volatile("vpternlogq $0x12,%zmm28,%zmm29,%zmm30"); 754 755 /* AVX-512: Op code 0f 3a 26 */ 756 757 asm volatile("vgetmantps $0x12,%zmm26,%zmm27"); 758 asm volatile("vgetmantpd $0x12,%zmm29,%zmm30"); 759 760 /* AVX-512: Op code 0f 3a 27 */ 761 762 asm volatile("vgetmantss $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 763 asm volatile("vgetmantsd 
$0x12,%xmm28,%xmm29,%xmm30{%k7}"); 764 765 /* AVX-512: Op code 0f 3a 38 */ 766 767 asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 768 asm volatile("vinserti32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 769 asm volatile("vinserti64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 770 771 /* AVX-512: Op code 0f 3a 39 */ 772 773 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 774 asm volatile("vextracti32x4 $0x12,%zmm25,%xmm26{%k7}"); 775 asm volatile("vextracti64x2 $0x12,%zmm25,%xmm26{%k7}"); 776 777 /* AVX-512: Op code 0f 3a 3a */ 778 779 asm volatile("vinserti32x8 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 780 asm volatile("vinserti64x4 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 781 782 /* AVX-512: Op code 0f 3a 3b */ 783 784 asm volatile("vextracti32x8 $0x12,%zmm29,%ymm30{%k7}"); 785 asm volatile("vextracti64x4 $0x12,%zmm26,%ymm27{%k7}"); 786 787 /* AVX-512: Op code 0f 3a 3e */ 788 789 asm volatile("vpcmpub $0x12,%zmm29,%zmm30,%k5"); 790 asm volatile("vpcmpuw $0x12,%zmm26,%zmm27,%k5"); 791 792 /* AVX-512: Op code 0f 3a 3f */ 793 794 asm volatile("vpcmpb $0x12,%zmm29,%zmm30,%k5"); 795 asm volatile("vpcmpw $0x12,%zmm26,%zmm27,%k5"); 796 797 /* AVX-512: Op code 0f 3a 42 */ 798 799 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 800 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 801 802 /* AVX-512: Op code 0f 3a 43 */ 803 804 asm volatile("vshufi32x4 $0x12,%zmm25,%zmm26,%zmm27"); 805 asm volatile("vshufi64x2 $0x12,%zmm28,%zmm29,%zmm30"); 806 807 /* AVX-512: Op code 0f 3a 50 */ 808 809 asm volatile("vrangeps $0x12,%zmm25,%zmm26,%zmm27"); 810 asm volatile("vrangepd $0x12,%zmm28,%zmm29,%zmm30"); 811 812 /* AVX-512: Op code 0f 3a 51 */ 813 814 asm volatile("vrangess $0x12,%xmm25,%xmm26,%xmm27"); 815 asm volatile("vrangesd $0x12,%xmm28,%xmm29,%xmm30"); 816 817 /* AVX-512: Op code 0f 3a 54 */ 818 819 asm volatile("vfixupimmps $0x12,%zmm28,%zmm29,%zmm30"); 820 asm volatile("vfixupimmpd $0x12,%zmm25,%zmm26,%zmm27"); 821 822 /* AVX-512: Op code 0f 3a 55 */ 823 824 asm volatile("vfixupimmss 
$0x12,%xmm28,%xmm29,%xmm30{%k7}"); 825 asm volatile("vfixupimmsd $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 826 827 /* AVX-512: Op code 0f 3a 56 */ 828 829 asm volatile("vreduceps $0x12,%zmm26,%zmm27"); 830 asm volatile("vreducepd $0x12,%zmm29,%zmm30"); 831 832 /* AVX-512: Op code 0f 3a 57 */ 833 834 asm volatile("vreducess $0x12,%xmm25,%xmm26,%xmm27"); 835 asm volatile("vreducesd $0x12,%xmm28,%xmm29,%xmm30"); 836 837 /* AVX-512: Op code 0f 3a 66 */ 838 839 asm volatile("vfpclassps $0x12,%zmm27,%k5"); 840 asm volatile("vfpclasspd $0x12,%zmm30,%k5"); 841 842 /* AVX-512: Op code 0f 3a 67 */ 843 844 asm volatile("vfpclassss $0x12,%xmm27,%k5"); 845 asm volatile("vfpclasssd $0x12,%xmm30,%k5"); 846 847 /* AVX-512: Op code 0f 72 (Grp13) */ 848 849 asm volatile("vprord $0x12,%zmm25,%zmm26"); 850 asm volatile("vprorq $0x12,%zmm25,%zmm26"); 851 asm volatile("vprold $0x12,%zmm29,%zmm30"); 852 asm volatile("vprolq $0x12,%zmm29,%zmm30"); 853 asm volatile("psrad $0x2,%mm6"); 854 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 855 asm volatile("vpsrad $0x5,%zmm26,%zmm22"); 856 asm volatile("vpsraq $0x5,%zmm26,%zmm22"); 857 858 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 859 860 asm volatile("vgatherpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 861 asm volatile("vgatherpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 862 asm volatile("vgatherpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 863 asm volatile("vgatherpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 864 asm volatile("vscatterpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 865 asm volatile("vscatterpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 866 asm volatile("vscatterpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 867 asm volatile("vscatterpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 868 869 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 870 871 asm volatile("vgatherpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 872 asm volatile("vgatherpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 873 asm volatile("vgatherpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 874 asm volatile("vgatherpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 875 asm volatile("vscatterpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 876 
asm volatile("vscatterpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 877 asm volatile("vscatterpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 878 asm volatile("vscatterpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 879 880 /* AVX-512: Examples */ 881 882 asm volatile("vaddpd %zmm28,%zmm29,%zmm30"); 883 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}"); 884 asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}{z}"); 885 asm volatile("vaddpd {rn-sae},%zmm28,%zmm29,%zmm30"); 886 asm volatile("vaddpd {ru-sae},%zmm28,%zmm29,%zmm30"); 887 asm volatile("vaddpd {rd-sae},%zmm28,%zmm29,%zmm30"); 888 asm volatile("vaddpd {rz-sae},%zmm28,%zmm29,%zmm30"); 889 asm volatile("vaddpd (%rcx),%zmm29,%zmm30"); 890 asm volatile("vaddpd 0x123(%rax,%r14,8),%zmm29,%zmm30"); 891 asm volatile("vaddpd (%rcx){1to8},%zmm29,%zmm30"); 892 asm volatile("vaddpd 0x1fc0(%rdx),%zmm29,%zmm30"); 893 asm volatile("vaddpd 0x3f8(%rdx){1to8},%zmm29,%zmm30"); 894 asm volatile("vcmpeq_uqps 0x1fc(%rdx){1to16},%zmm30,%k5"); 895 asm volatile("vcmpltsd 0x123(%rax,%r14,8),%xmm29,%k5{%k7}"); 896 asm volatile("vcmplesd {sae},%xmm28,%xmm29,%k5{%k7}"); 897 asm volatile("vgetmantss $0x5b,0x123(%rax,%r14,8),%xmm29,%xmm30{%k7}"); 898 899 /* bndmk m64, bnd */ 900 901 asm volatile("bndmk (%rax), %bnd0"); 902 asm volatile("bndmk (%r8), %bnd0"); 903 asm volatile("bndmk (0x12345678), %bnd0"); 904 asm volatile("bndmk (%rax), %bnd3"); 905 asm volatile("bndmk (%rcx,%rax,1), %bnd0"); 906 asm volatile("bndmk 0x12345678(,%rax,1), %bnd0"); 907 asm volatile("bndmk (%rax,%rcx,1), %bnd0"); 908 asm volatile("bndmk (%rax,%rcx,8), %bnd0"); 909 asm volatile("bndmk 0x12(%rax), %bnd0"); 910 asm volatile("bndmk 0x12(%rbp), %bnd0"); 911 asm volatile("bndmk 0x12(%rcx,%rax,1), %bnd0"); 912 asm volatile("bndmk 0x12(%rbp,%rax,1), %bnd0"); 913 asm volatile("bndmk 0x12(%rax,%rcx,1), %bnd0"); 914 asm volatile("bndmk 0x12(%rax,%rcx,8), %bnd0"); 915 asm volatile("bndmk 0x12345678(%rax), %bnd0"); 916 asm volatile("bndmk 0x12345678(%rbp), %bnd0"); 917 asm volatile("bndmk 0x12345678(%rcx,%rax,1), 
%bnd0"); 918 asm volatile("bndmk 0x12345678(%rbp,%rax,1), %bnd0"); 919 asm volatile("bndmk 0x12345678(%rax,%rcx,1), %bnd0"); 920 asm volatile("bndmk 0x12345678(%rax,%rcx,8), %bnd0"); 921 922 /* bndcl r/m64, bnd */ 923 924 asm volatile("bndcl (%rax), %bnd0"); 925 asm volatile("bndcl (%r8), %bnd0"); 926 asm volatile("bndcl (0x12345678), %bnd0"); 927 asm volatile("bndcl (%rax), %bnd3"); 928 asm volatile("bndcl (%rcx,%rax,1), %bnd0"); 929 asm volatile("bndcl 0x12345678(,%rax,1), %bnd0"); 930 asm volatile("bndcl (%rax,%rcx,1), %bnd0"); 931 asm volatile("bndcl (%rax,%rcx,8), %bnd0"); 932 asm volatile("bndcl 0x12(%rax), %bnd0"); 933 asm volatile("bndcl 0x12(%rbp), %bnd0"); 934 asm volatile("bndcl 0x12(%rcx,%rax,1), %bnd0"); 935 asm volatile("bndcl 0x12(%rbp,%rax,1), %bnd0"); 936 asm volatile("bndcl 0x12(%rax,%rcx,1), %bnd0"); 937 asm volatile("bndcl 0x12(%rax,%rcx,8), %bnd0"); 938 asm volatile("bndcl 0x12345678(%rax), %bnd0"); 939 asm volatile("bndcl 0x12345678(%rbp), %bnd0"); 940 asm volatile("bndcl 0x12345678(%rcx,%rax,1), %bnd0"); 941 asm volatile("bndcl 0x12345678(%rbp,%rax,1), %bnd0"); 942 asm volatile("bndcl 0x12345678(%rax,%rcx,1), %bnd0"); 943 asm volatile("bndcl 0x12345678(%rax,%rcx,8), %bnd0"); 944 asm volatile("bndcl %rax, %bnd0"); 945 946 /* bndcu r/m64, bnd */ 947 948 asm volatile("bndcu (%rax), %bnd0"); 949 asm volatile("bndcu (%r8), %bnd0"); 950 asm volatile("bndcu (0x12345678), %bnd0"); 951 asm volatile("bndcu (%rax), %bnd3"); 952 asm volatile("bndcu (%rcx,%rax,1), %bnd0"); 953 asm volatile("bndcu 0x12345678(,%rax,1), %bnd0"); 954 asm volatile("bndcu (%rax,%rcx,1), %bnd0"); 955 asm volatile("bndcu (%rax,%rcx,8), %bnd0"); 956 asm volatile("bndcu 0x12(%rax), %bnd0"); 957 asm volatile("bndcu 0x12(%rbp), %bnd0"); 958 asm volatile("bndcu 0x12(%rcx,%rax,1), %bnd0"); 959 asm volatile("bndcu 0x12(%rbp,%rax,1), %bnd0"); 960 asm volatile("bndcu 0x12(%rax,%rcx,1), %bnd0"); 961 asm volatile("bndcu 0x12(%rax,%rcx,8), %bnd0"); 962 asm volatile("bndcu 0x12345678(%rax), 
%bnd0"); 963 asm volatile("bndcu 0x12345678(%rbp), %bnd0"); 964 asm volatile("bndcu 0x12345678(%rcx,%rax,1), %bnd0"); 965 asm volatile("bndcu 0x12345678(%rbp,%rax,1), %bnd0"); 966 asm volatile("bndcu 0x12345678(%rax,%rcx,1), %bnd0"); 967 asm volatile("bndcu 0x12345678(%rax,%rcx,8), %bnd0"); 968 asm volatile("bndcu %rax, %bnd0"); 969 970 /* bndcn r/m64, bnd */ 971 972 asm volatile("bndcn (%rax), %bnd0"); 973 asm volatile("bndcn (%r8), %bnd0"); 974 asm volatile("bndcn (0x12345678), %bnd0"); 975 asm volatile("bndcn (%rax), %bnd3"); 976 asm volatile("bndcn (%rcx,%rax,1), %bnd0"); 977 asm volatile("bndcn 0x12345678(,%rax,1), %bnd0"); 978 asm volatile("bndcn (%rax,%rcx,1), %bnd0"); 979 asm volatile("bndcn (%rax,%rcx,8), %bnd0"); 980 asm volatile("bndcn 0x12(%rax), %bnd0"); 981 asm volatile("bndcn 0x12(%rbp), %bnd0"); 982 asm volatile("bndcn 0x12(%rcx,%rax,1), %bnd0"); 983 asm volatile("bndcn 0x12(%rbp,%rax,1), %bnd0"); 984 asm volatile("bndcn 0x12(%rax,%rcx,1), %bnd0"); 985 asm volatile("bndcn 0x12(%rax,%rcx,8), %bnd0"); 986 asm volatile("bndcn 0x12345678(%rax), %bnd0"); 987 asm volatile("bndcn 0x12345678(%rbp), %bnd0"); 988 asm volatile("bndcn 0x12345678(%rcx,%rax,1), %bnd0"); 989 asm volatile("bndcn 0x12345678(%rbp,%rax,1), %bnd0"); 990 asm volatile("bndcn 0x12345678(%rax,%rcx,1), %bnd0"); 991 asm volatile("bndcn 0x12345678(%rax,%rcx,8), %bnd0"); 992 asm volatile("bndcn %rax, %bnd0"); 993 994 /* bndmov m128, bnd */ 995 996 asm volatile("bndmov (%rax), %bnd0"); 997 asm volatile("bndmov (%r8), %bnd0"); 998 asm volatile("bndmov (0x12345678), %bnd0"); 999 asm volatile("bndmov (%rax), %bnd3"); 1000 asm volatile("bndmov (%rcx,%rax,1), %bnd0"); 1001 asm volatile("bndmov 0x12345678(,%rax,1), %bnd0"); 1002 asm volatile("bndmov (%rax,%rcx,1), %bnd0"); 1003 asm volatile("bndmov (%rax,%rcx,8), %bnd0"); 1004 asm volatile("bndmov 0x12(%rax), %bnd0"); 1005 asm volatile("bndmov 0x12(%rbp), %bnd0"); 1006 asm volatile("bndmov 0x12(%rcx,%rax,1), %bnd0"); 1007 asm volatile("bndmov 
0x12(%rbp,%rax,1), %bnd0"); 1008 asm volatile("bndmov 0x12(%rax,%rcx,1), %bnd0"); 1009 asm volatile("bndmov 0x12(%rax,%rcx,8), %bnd0"); 1010 asm volatile("bndmov 0x12345678(%rax), %bnd0"); 1011 asm volatile("bndmov 0x12345678(%rbp), %bnd0"); 1012 asm volatile("bndmov 0x12345678(%rcx,%rax,1), %bnd0"); 1013 asm volatile("bndmov 0x12345678(%rbp,%rax,1), %bnd0"); 1014 asm volatile("bndmov 0x12345678(%rax,%rcx,1), %bnd0"); 1015 asm volatile("bndmov 0x12345678(%rax,%rcx,8), %bnd0"); 1016 1017 /* bndmov bnd, m128 */ 1018 1019 asm volatile("bndmov %bnd0, (%rax)"); 1020 asm volatile("bndmov %bnd0, (%r8)"); 1021 asm volatile("bndmov %bnd0, (0x12345678)"); 1022 asm volatile("bndmov %bnd3, (%rax)"); 1023 asm volatile("bndmov %bnd0, (%rcx,%rax,1)"); 1024 asm volatile("bndmov %bnd0, 0x12345678(,%rax,1)"); 1025 asm volatile("bndmov %bnd0, (%rax,%rcx,1)"); 1026 asm volatile("bndmov %bnd0, (%rax,%rcx,8)"); 1027 asm volatile("bndmov %bnd0, 0x12(%rax)"); 1028 asm volatile("bndmov %bnd0, 0x12(%rbp)"); 1029 asm volatile("bndmov %bnd0, 0x12(%rcx,%rax,1)"); 1030 asm volatile("bndmov %bnd0, 0x12(%rbp,%rax,1)"); 1031 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,1)"); 1032 asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,8)"); 1033 asm volatile("bndmov %bnd0, 0x12345678(%rax)"); 1034 asm volatile("bndmov %bnd0, 0x12345678(%rbp)"); 1035 asm volatile("bndmov %bnd0, 0x12345678(%rcx,%rax,1)"); 1036 asm volatile("bndmov %bnd0, 0x12345678(%rbp,%rax,1)"); 1037 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,1)"); 1038 asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,8)"); 1039 1040 /* bndmov bnd2, bnd1 */ 1041 1042 asm volatile("bndmov %bnd0, %bnd1"); 1043 asm volatile("bndmov %bnd1, %bnd0"); 1044 1045 /* bndldx mib, bnd */ 1046 1047 asm volatile("bndldx (%rax), %bnd0"); 1048 asm volatile("bndldx (%r8), %bnd0"); 1049 asm volatile("bndldx (0x12345678), %bnd0"); 1050 asm volatile("bndldx (%rax), %bnd3"); 1051 asm volatile("bndldx (%rcx,%rax,1), %bnd0"); 1052 asm volatile("bndldx 0x12345678(,%rax,1), 
%bnd0"); 1053 asm volatile("bndldx (%rax,%rcx,1), %bnd0"); 1054 asm volatile("bndldx 0x12(%rax), %bnd0"); 1055 asm volatile("bndldx 0x12(%rbp), %bnd0"); 1056 asm volatile("bndldx 0x12(%rcx,%rax,1), %bnd0"); 1057 asm volatile("bndldx 0x12(%rbp,%rax,1), %bnd0"); 1058 asm volatile("bndldx 0x12(%rax,%rcx,1), %bnd0"); 1059 asm volatile("bndldx 0x12345678(%rax), %bnd0"); 1060 asm volatile("bndldx 0x12345678(%rbp), %bnd0"); 1061 asm volatile("bndldx 0x12345678(%rcx,%rax,1), %bnd0"); 1062 asm volatile("bndldx 0x12345678(%rbp,%rax,1), %bnd0"); 1063 asm volatile("bndldx 0x12345678(%rax,%rcx,1), %bnd0"); 1064 1065 /* bndstx bnd, mib */ 1066 1067 asm volatile("bndstx %bnd0, (%rax)"); 1068 asm volatile("bndstx %bnd0, (%r8)"); 1069 asm volatile("bndstx %bnd0, (0x12345678)"); 1070 asm volatile("bndstx %bnd3, (%rax)"); 1071 asm volatile("bndstx %bnd0, (%rcx,%rax,1)"); 1072 asm volatile("bndstx %bnd0, 0x12345678(,%rax,1)"); 1073 asm volatile("bndstx %bnd0, (%rax,%rcx,1)"); 1074 asm volatile("bndstx %bnd0, 0x12(%rax)"); 1075 asm volatile("bndstx %bnd0, 0x12(%rbp)"); 1076 asm volatile("bndstx %bnd0, 0x12(%rcx,%rax,1)"); 1077 asm volatile("bndstx %bnd0, 0x12(%rbp,%rax,1)"); 1078 asm volatile("bndstx %bnd0, 0x12(%rax,%rcx,1)"); 1079 asm volatile("bndstx %bnd0, 0x12345678(%rax)"); 1080 asm volatile("bndstx %bnd0, 0x12345678(%rbp)"); 1081 asm volatile("bndstx %bnd0, 0x12345678(%rcx,%rax,1)"); 1082 asm volatile("bndstx %bnd0, 0x12345678(%rbp,%rax,1)"); 1083 asm volatile("bndstx %bnd0, 0x12345678(%rax,%rcx,1)"); 1084 1085 /* bnd prefix on call, ret, jmp and all jcc */ 1086 1087 asm volatile("bnd call label1"); /* Expecting: call unconditional 0 */ 1088 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 1089 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 1090 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1091 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 1092 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 
*/ 1093 asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0 */ 1094 1095 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 1096 1097 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 1098 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 1099 asm volatile("sha1rnds4 $0x91, %xmm8, %xmm0"); 1100 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm8"); 1101 asm volatile("sha1rnds4 $0x91, %xmm15, %xmm8"); 1102 asm volatile("sha1rnds4 $0x91, (%rax), %xmm0"); 1103 asm volatile("sha1rnds4 $0x91, (%r8), %xmm0"); 1104 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 1105 asm volatile("sha1rnds4 $0x91, (%rax), %xmm3"); 1106 asm volatile("sha1rnds4 $0x91, (%rcx,%rax,1), %xmm0"); 1107 asm volatile("sha1rnds4 $0x91, 0x12345678(,%rax,1), %xmm0"); 1108 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,1), %xmm0"); 1109 asm volatile("sha1rnds4 $0x91, (%rax,%rcx,8), %xmm0"); 1110 asm volatile("sha1rnds4 $0x91, 0x12(%rax), %xmm0"); 1111 asm volatile("sha1rnds4 $0x91, 0x12(%rbp), %xmm0"); 1112 asm volatile("sha1rnds4 $0x91, 0x12(%rcx,%rax,1), %xmm0"); 1113 asm volatile("sha1rnds4 $0x91, 0x12(%rbp,%rax,1), %xmm0"); 1114 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,1), %xmm0"); 1115 asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,8), %xmm0"); 1116 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax), %xmm0"); 1117 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp), %xmm0"); 1118 asm volatile("sha1rnds4 $0x91, 0x12345678(%rcx,%rax,1), %xmm0"); 1119 asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp,%rax,1), %xmm0"); 1120 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,1), %xmm0"); 1121 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm0"); 1122 asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm15"); 1123 1124 /* sha1nexte xmm2/m128, xmm1 */ 1125 1126 asm volatile("sha1nexte %xmm1, %xmm0"); 1127 asm volatile("sha1nexte %xmm7, %xmm2"); 1128 asm volatile("sha1nexte %xmm8, %xmm0"); 1129 asm volatile("sha1nexte %xmm7, %xmm8"); 1130 asm volatile("sha1nexte %xmm15, %xmm8"); 1131 asm volatile("sha1nexte 
(%rax), %xmm0"); 1132 asm volatile("sha1nexte (%r8), %xmm0"); 1133 asm volatile("sha1nexte (0x12345678), %xmm0"); 1134 asm volatile("sha1nexte (%rax), %xmm3"); 1135 asm volatile("sha1nexte (%rcx,%rax,1), %xmm0"); 1136 asm volatile("sha1nexte 0x12345678(,%rax,1), %xmm0"); 1137 asm volatile("sha1nexte (%rax,%rcx,1), %xmm0"); 1138 asm volatile("sha1nexte (%rax,%rcx,8), %xmm0"); 1139 asm volatile("sha1nexte 0x12(%rax), %xmm0"); 1140 asm volatile("sha1nexte 0x12(%rbp), %xmm0"); 1141 asm volatile("sha1nexte 0x12(%rcx,%rax,1), %xmm0"); 1142 asm volatile("sha1nexte 0x12(%rbp,%rax,1), %xmm0"); 1143 asm volatile("sha1nexte 0x12(%rax,%rcx,1), %xmm0"); 1144 asm volatile("sha1nexte 0x12(%rax,%rcx,8), %xmm0"); 1145 asm volatile("sha1nexte 0x12345678(%rax), %xmm0"); 1146 asm volatile("sha1nexte 0x12345678(%rbp), %xmm0"); 1147 asm volatile("sha1nexte 0x12345678(%rcx,%rax,1), %xmm0"); 1148 asm volatile("sha1nexte 0x12345678(%rbp,%rax,1), %xmm0"); 1149 asm volatile("sha1nexte 0x12345678(%rax,%rcx,1), %xmm0"); 1150 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm0"); 1151 asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm15"); 1152 1153 /* sha1msg1 xmm2/m128, xmm1 */ 1154 1155 asm volatile("sha1msg1 %xmm1, %xmm0"); 1156 asm volatile("sha1msg1 %xmm7, %xmm2"); 1157 asm volatile("sha1msg1 %xmm8, %xmm0"); 1158 asm volatile("sha1msg1 %xmm7, %xmm8"); 1159 asm volatile("sha1msg1 %xmm15, %xmm8"); 1160 asm volatile("sha1msg1 (%rax), %xmm0"); 1161 asm volatile("sha1msg1 (%r8), %xmm0"); 1162 asm volatile("sha1msg1 (0x12345678), %xmm0"); 1163 asm volatile("sha1msg1 (%rax), %xmm3"); 1164 asm volatile("sha1msg1 (%rcx,%rax,1), %xmm0"); 1165 asm volatile("sha1msg1 0x12345678(,%rax,1), %xmm0"); 1166 asm volatile("sha1msg1 (%rax,%rcx,1), %xmm0"); 1167 asm volatile("sha1msg1 (%rax,%rcx,8), %xmm0"); 1168 asm volatile("sha1msg1 0x12(%rax), %xmm0"); 1169 asm volatile("sha1msg1 0x12(%rbp), %xmm0"); 1170 asm volatile("sha1msg1 0x12(%rcx,%rax,1), %xmm0"); 1171 asm volatile("sha1msg1 
0x12(%rbp,%rax,1), %xmm0"); 1172 asm volatile("sha1msg1 0x12(%rax,%rcx,1), %xmm0"); 1173 asm volatile("sha1msg1 0x12(%rax,%rcx,8), %xmm0"); 1174 asm volatile("sha1msg1 0x12345678(%rax), %xmm0"); 1175 asm volatile("sha1msg1 0x12345678(%rbp), %xmm0"); 1176 asm volatile("sha1msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1177 asm volatile("sha1msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1178 asm volatile("sha1msg1 0x12345678(%rax,%rcx,1), %xmm0"); 1179 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1180 asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1181 1182 /* sha1msg2 xmm2/m128, xmm1 */ 1183 1184 asm volatile("sha1msg2 %xmm1, %xmm0"); 1185 asm volatile("sha1msg2 %xmm7, %xmm2"); 1186 asm volatile("sha1msg2 %xmm8, %xmm0"); 1187 asm volatile("sha1msg2 %xmm7, %xmm8"); 1188 asm volatile("sha1msg2 %xmm15, %xmm8"); 1189 asm volatile("sha1msg2 (%rax), %xmm0"); 1190 asm volatile("sha1msg2 (%r8), %xmm0"); 1191 asm volatile("sha1msg2 (0x12345678), %xmm0"); 1192 asm volatile("sha1msg2 (%rax), %xmm3"); 1193 asm volatile("sha1msg2 (%rcx,%rax,1), %xmm0"); 1194 asm volatile("sha1msg2 0x12345678(,%rax,1), %xmm0"); 1195 asm volatile("sha1msg2 (%rax,%rcx,1), %xmm0"); 1196 asm volatile("sha1msg2 (%rax,%rcx,8), %xmm0"); 1197 asm volatile("sha1msg2 0x12(%rax), %xmm0"); 1198 asm volatile("sha1msg2 0x12(%rbp), %xmm0"); 1199 asm volatile("sha1msg2 0x12(%rcx,%rax,1), %xmm0"); 1200 asm volatile("sha1msg2 0x12(%rbp,%rax,1), %xmm0"); 1201 asm volatile("sha1msg2 0x12(%rax,%rcx,1), %xmm0"); 1202 asm volatile("sha1msg2 0x12(%rax,%rcx,8), %xmm0"); 1203 asm volatile("sha1msg2 0x12345678(%rax), %xmm0"); 1204 asm volatile("sha1msg2 0x12345678(%rbp), %xmm0"); 1205 asm volatile("sha1msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1206 asm volatile("sha1msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1207 asm volatile("sha1msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1208 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm0"); 1209 asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1210 1211 /* sha256rnds2 
<XMM0>, xmm2/m128, xmm1 */ 1212 /* Note sha256rnds2 has an implicit operand 'xmm0' */ 1213 1214 asm volatile("sha256rnds2 %xmm4, %xmm1"); 1215 asm volatile("sha256rnds2 %xmm7, %xmm2"); 1216 asm volatile("sha256rnds2 %xmm8, %xmm1"); 1217 asm volatile("sha256rnds2 %xmm7, %xmm8"); 1218 asm volatile("sha256rnds2 %xmm15, %xmm8"); 1219 asm volatile("sha256rnds2 (%rax), %xmm1"); 1220 asm volatile("sha256rnds2 (%r8), %xmm1"); 1221 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 1222 asm volatile("sha256rnds2 (%rax), %xmm3"); 1223 asm volatile("sha256rnds2 (%rcx,%rax,1), %xmm1"); 1224 asm volatile("sha256rnds2 0x12345678(,%rax,1), %xmm1"); 1225 asm volatile("sha256rnds2 (%rax,%rcx,1), %xmm1"); 1226 asm volatile("sha256rnds2 (%rax,%rcx,8), %xmm1"); 1227 asm volatile("sha256rnds2 0x12(%rax), %xmm1"); 1228 asm volatile("sha256rnds2 0x12(%rbp), %xmm1"); 1229 asm volatile("sha256rnds2 0x12(%rcx,%rax,1), %xmm1"); 1230 asm volatile("sha256rnds2 0x12(%rbp,%rax,1), %xmm1"); 1231 asm volatile("sha256rnds2 0x12(%rax,%rcx,1), %xmm1"); 1232 asm volatile("sha256rnds2 0x12(%rax,%rcx,8), %xmm1"); 1233 asm volatile("sha256rnds2 0x12345678(%rax), %xmm1"); 1234 asm volatile("sha256rnds2 0x12345678(%rbp), %xmm1"); 1235 asm volatile("sha256rnds2 0x12345678(%rcx,%rax,1), %xmm1"); 1236 asm volatile("sha256rnds2 0x12345678(%rbp,%rax,1), %xmm1"); 1237 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,1), %xmm1"); 1238 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm1"); 1239 asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm15"); 1240 1241 /* sha256msg1 xmm2/m128, xmm1 */ 1242 1243 asm volatile("sha256msg1 %xmm1, %xmm0"); 1244 asm volatile("sha256msg1 %xmm7, %xmm2"); 1245 asm volatile("sha256msg1 %xmm8, %xmm0"); 1246 asm volatile("sha256msg1 %xmm7, %xmm8"); 1247 asm volatile("sha256msg1 %xmm15, %xmm8"); 1248 asm volatile("sha256msg1 (%rax), %xmm0"); 1249 asm volatile("sha256msg1 (%r8), %xmm0"); 1250 asm volatile("sha256msg1 (0x12345678), %xmm0"); 1251 asm volatile("sha256msg1 (%rax), 
%xmm3"); 1252 asm volatile("sha256msg1 (%rcx,%rax,1), %xmm0"); 1253 asm volatile("sha256msg1 0x12345678(,%rax,1), %xmm0"); 1254 asm volatile("sha256msg1 (%rax,%rcx,1), %xmm0"); 1255 asm volatile("sha256msg1 (%rax,%rcx,8), %xmm0"); 1256 asm volatile("sha256msg1 0x12(%rax), %xmm0"); 1257 asm volatile("sha256msg1 0x12(%rbp), %xmm0"); 1258 asm volatile("sha256msg1 0x12(%rcx,%rax,1), %xmm0"); 1259 asm volatile("sha256msg1 0x12(%rbp,%rax,1), %xmm0"); 1260 asm volatile("sha256msg1 0x12(%rax,%rcx,1), %xmm0"); 1261 asm volatile("sha256msg1 0x12(%rax,%rcx,8), %xmm0"); 1262 asm volatile("sha256msg1 0x12345678(%rax), %xmm0"); 1263 asm volatile("sha256msg1 0x12345678(%rbp), %xmm0"); 1264 asm volatile("sha256msg1 0x12345678(%rcx,%rax,1), %xmm0"); 1265 asm volatile("sha256msg1 0x12345678(%rbp,%rax,1), %xmm0"); 1266 asm volatile("sha256msg1 0x12345678(%rax,%rcx,1), %xmm0"); 1267 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm0"); 1268 asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm15"); 1269 1270 /* sha256msg2 xmm2/m128, xmm1 */ 1271 1272 asm volatile("sha256msg2 %xmm1, %xmm0"); 1273 asm volatile("sha256msg2 %xmm7, %xmm2"); 1274 asm volatile("sha256msg2 %xmm8, %xmm0"); 1275 asm volatile("sha256msg2 %xmm7, %xmm8"); 1276 asm volatile("sha256msg2 %xmm15, %xmm8"); 1277 asm volatile("sha256msg2 (%rax), %xmm0"); 1278 asm volatile("sha256msg2 (%r8), %xmm0"); 1279 asm volatile("sha256msg2 (0x12345678), %xmm0"); 1280 asm volatile("sha256msg2 (%rax), %xmm3"); 1281 asm volatile("sha256msg2 (%rcx,%rax,1), %xmm0"); 1282 asm volatile("sha256msg2 0x12345678(,%rax,1), %xmm0"); 1283 asm volatile("sha256msg2 (%rax,%rcx,1), %xmm0"); 1284 asm volatile("sha256msg2 (%rax,%rcx,8), %xmm0"); 1285 asm volatile("sha256msg2 0x12(%rax), %xmm0"); 1286 asm volatile("sha256msg2 0x12(%rbp), %xmm0"); 1287 asm volatile("sha256msg2 0x12(%rcx,%rax,1), %xmm0"); 1288 asm volatile("sha256msg2 0x12(%rbp,%rax,1), %xmm0"); 1289 asm volatile("sha256msg2 0x12(%rax,%rcx,1), %xmm0"); 1290 asm volatile("sha256msg2 
0x12(%rax,%rcx,8), %xmm0"); 1291 asm volatile("sha256msg2 0x12345678(%rax), %xmm0"); 1292 asm volatile("sha256msg2 0x12345678(%rbp), %xmm0"); 1293 asm volatile("sha256msg2 0x12345678(%rcx,%rax,1), %xmm0"); 1294 asm volatile("sha256msg2 0x12345678(%rbp,%rax,1), %xmm0"); 1295 asm volatile("sha256msg2 0x12345678(%rax,%rcx,1), %xmm0"); 1296 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm0"); 1297 asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm15"); 1298 1299 /* clflushopt m8 */ 1300 1301 asm volatile("clflushopt (%rax)"); 1302 asm volatile("clflushopt (%r8)"); 1303 asm volatile("clflushopt (0x12345678)"); 1304 asm volatile("clflushopt 0x12345678(%rax,%rcx,8)"); 1305 asm volatile("clflushopt 0x12345678(%r8,%rcx,8)"); 1306 /* Also check instructions in the same group encoding as clflushopt */ 1307 asm volatile("clflush (%rax)"); 1308 asm volatile("clflush (%r8)"); 1309 asm volatile("sfence"); 1310 1311 /* clwb m8 */ 1312 1313 asm volatile("clwb (%rax)"); 1314 asm volatile("clwb (%r8)"); 1315 asm volatile("clwb (0x12345678)"); 1316 asm volatile("clwb 0x12345678(%rax,%rcx,8)"); 1317 asm volatile("clwb 0x12345678(%r8,%rcx,8)"); 1318 /* Also check instructions in the same group encoding as clwb */ 1319 asm volatile("xsaveopt (%rax)"); 1320 asm volatile("xsaveopt (%r8)"); 1321 asm volatile("mfence"); 1322 1323 /* xsavec mem */ 1324 1325 asm volatile("xsavec (%rax)"); 1326 asm volatile("xsavec (%r8)"); 1327 asm volatile("xsavec (0x12345678)"); 1328 asm volatile("xsavec 0x12345678(%rax,%rcx,8)"); 1329 asm volatile("xsavec 0x12345678(%r8,%rcx,8)"); 1330 1331 /* xsaves mem */ 1332 1333 asm volatile("xsaves (%rax)"); 1334 asm volatile("xsaves (%r8)"); 1335 asm volatile("xsaves (0x12345678)"); 1336 asm volatile("xsaves 0x12345678(%rax,%rcx,8)"); 1337 asm volatile("xsaves 0x12345678(%r8,%rcx,8)"); 1338 1339 /* xrstors mem */ 1340 1341 asm volatile("xrstors (%rax)"); 1342 asm volatile("xrstors (%r8)"); 1343 asm volatile("xrstors (0x12345678)"); 1344 asm 
volatile("xrstors 0x12345678(%rax,%rcx,8)"); 1345 asm volatile("xrstors 0x12345678(%r8,%rcx,8)"); 1346 1347 /* ptwrite */ 1348 1349 asm volatile("ptwrite (%rax)"); 1350 asm volatile("ptwrite (%r8)"); 1351 asm volatile("ptwrite (0x12345678)"); 1352 asm volatile("ptwrite 0x12345678(%rax,%rcx,8)"); 1353 asm volatile("ptwrite 0x12345678(%r8,%rcx,8)"); 1354 1355 asm volatile("ptwritel (%rax)"); 1356 asm volatile("ptwritel (%r8)"); 1357 asm volatile("ptwritel (0x12345678)"); 1358 asm volatile("ptwritel 0x12345678(%rax,%rcx,8)"); 1359 asm volatile("ptwritel 0x12345678(%r8,%rcx,8)"); 1360 1361 asm volatile("ptwriteq (%rax)"); 1362 asm volatile("ptwriteq (%r8)"); 1363 asm volatile("ptwriteq (0x12345678)"); 1364 asm volatile("ptwriteq 0x12345678(%rax,%rcx,8)"); 1365 asm volatile("ptwriteq 0x12345678(%r8,%rcx,8)"); 1366 1367 #else /* #ifdef __x86_64__ */ 1368 1369 /* bound r32, mem (same op code as EVEX prefix) */ 1370 1371 asm volatile("bound %eax, 0x12345678(%ecx)"); 1372 asm volatile("bound %ecx, 0x12345678(%eax)"); 1373 asm volatile("bound %edx, 0x12345678(%eax)"); 1374 asm volatile("bound %ebx, 0x12345678(%eax)"); 1375 asm volatile("bound %esp, 0x12345678(%eax)"); 1376 asm volatile("bound %ebp, 0x12345678(%eax)"); 1377 asm volatile("bound %esi, 0x12345678(%eax)"); 1378 asm volatile("bound %edi, 0x12345678(%eax)"); 1379 asm volatile("bound %ecx, (%eax)"); 1380 asm volatile("bound %eax, (0x12345678)"); 1381 asm volatile("bound %edx, (%ecx,%eax,1)"); 1382 asm volatile("bound %edx, 0x12345678(,%eax,1)"); 1383 asm volatile("bound %edx, (%eax,%ecx,1)"); 1384 asm volatile("bound %edx, (%eax,%ecx,8)"); 1385 asm volatile("bound %edx, 0x12(%eax)"); 1386 asm volatile("bound %edx, 0x12(%ebp)"); 1387 asm volatile("bound %edx, 0x12(%ecx,%eax,1)"); 1388 asm volatile("bound %edx, 0x12(%ebp,%eax,1)"); 1389 asm volatile("bound %edx, 0x12(%eax,%ecx,1)"); 1390 asm volatile("bound %edx, 0x12(%eax,%ecx,8)"); 1391 asm volatile("bound %edx, 0x12345678(%eax)"); 1392 asm volatile("bound %edx, 
0x12345678(%ebp)"); 1393 asm volatile("bound %edx, 0x12345678(%ecx,%eax,1)"); 1394 asm volatile("bound %edx, 0x12345678(%ebp,%eax,1)"); 1395 asm volatile("bound %edx, 0x12345678(%eax,%ecx,1)"); 1396 asm volatile("bound %edx, 0x12345678(%eax,%ecx,8)"); 1397 1398 /* bound r16, mem (same op code as EVEX prefix) */ 1399 1400 asm volatile("bound %ax, 0x12345678(%ecx)"); 1401 asm volatile("bound %cx, 0x12345678(%eax)"); 1402 asm volatile("bound %dx, 0x12345678(%eax)"); 1403 asm volatile("bound %bx, 0x12345678(%eax)"); 1404 asm volatile("bound %sp, 0x12345678(%eax)"); 1405 asm volatile("bound %bp, 0x12345678(%eax)"); 1406 asm volatile("bound %si, 0x12345678(%eax)"); 1407 asm volatile("bound %di, 0x12345678(%eax)"); 1408 asm volatile("bound %cx, (%eax)"); 1409 asm volatile("bound %ax, (0x12345678)"); 1410 asm volatile("bound %dx, (%ecx,%eax,1)"); 1411 asm volatile("bound %dx, 0x12345678(,%eax,1)"); 1412 asm volatile("bound %dx, (%eax,%ecx,1)"); 1413 asm volatile("bound %dx, (%eax,%ecx,8)"); 1414 asm volatile("bound %dx, 0x12(%eax)"); 1415 asm volatile("bound %dx, 0x12(%ebp)"); 1416 asm volatile("bound %dx, 0x12(%ecx,%eax,1)"); 1417 asm volatile("bound %dx, 0x12(%ebp,%eax,1)"); 1418 asm volatile("bound %dx, 0x12(%eax,%ecx,1)"); 1419 asm volatile("bound %dx, 0x12(%eax,%ecx,8)"); 1420 asm volatile("bound %dx, 0x12345678(%eax)"); 1421 asm volatile("bound %dx, 0x12345678(%ebp)"); 1422 asm volatile("bound %dx, 0x12345678(%ecx,%eax,1)"); 1423 asm volatile("bound %dx, 0x12345678(%ebp,%eax,1)"); 1424 asm volatile("bound %dx, 0x12345678(%eax,%ecx,1)"); 1425 asm volatile("bound %dx, 0x12345678(%eax,%ecx,8)"); 1426 1427 /* AVX-512: Instructions with the same op codes as Mask Instructions */ 1428 1429 asm volatile("cmovno %eax,%ebx"); 1430 asm volatile("cmovno 0x12345678(%eax),%ecx"); 1431 asm volatile("cmovno 0x12345678(%eax),%cx"); 1432 1433 asm volatile("cmove %eax,%ebx"); 1434 asm volatile("cmove 0x12345678(%eax),%ecx"); 1435 asm volatile("cmove 0x12345678(%eax),%cx"); 1436 1437 
asm volatile("seto 0x12345678(%eax)"); 1438 asm volatile("setno 0x12345678(%eax)"); 1439 asm volatile("setb 0x12345678(%eax)"); 1440 asm volatile("setc 0x12345678(%eax)"); 1441 asm volatile("setnae 0x12345678(%eax)"); 1442 asm volatile("setae 0x12345678(%eax)"); 1443 asm volatile("setnb 0x12345678(%eax)"); 1444 asm volatile("setnc 0x12345678(%eax)"); 1445 asm volatile("sets 0x12345678(%eax)"); 1446 asm volatile("setns 0x12345678(%eax)"); 1447 1448 /* AVX-512: Mask Instructions */ 1449 1450 asm volatile("kandw %k7,%k6,%k5"); 1451 asm volatile("kandq %k7,%k6,%k5"); 1452 asm volatile("kandb %k7,%k6,%k5"); 1453 asm volatile("kandd %k7,%k6,%k5"); 1454 1455 asm volatile("kandnw %k7,%k6,%k5"); 1456 asm volatile("kandnq %k7,%k6,%k5"); 1457 asm volatile("kandnb %k7,%k6,%k5"); 1458 asm volatile("kandnd %k7,%k6,%k5"); 1459 1460 asm volatile("knotw %k7,%k6"); 1461 asm volatile("knotq %k7,%k6"); 1462 asm volatile("knotb %k7,%k6"); 1463 asm volatile("knotd %k7,%k6"); 1464 1465 asm volatile("korw %k7,%k6,%k5"); 1466 asm volatile("korq %k7,%k6,%k5"); 1467 asm volatile("korb %k7,%k6,%k5"); 1468 asm volatile("kord %k7,%k6,%k5"); 1469 1470 asm volatile("kxnorw %k7,%k6,%k5"); 1471 asm volatile("kxnorq %k7,%k6,%k5"); 1472 asm volatile("kxnorb %k7,%k6,%k5"); 1473 asm volatile("kxnord %k7,%k6,%k5"); 1474 1475 asm volatile("kxorw %k7,%k6,%k5"); 1476 asm volatile("kxorq %k7,%k6,%k5"); 1477 asm volatile("kxorb %k7,%k6,%k5"); 1478 asm volatile("kxord %k7,%k6,%k5"); 1479 1480 asm volatile("kaddw %k7,%k6,%k5"); 1481 asm volatile("kaddq %k7,%k6,%k5"); 1482 asm volatile("kaddb %k7,%k6,%k5"); 1483 asm volatile("kaddd %k7,%k6,%k5"); 1484 1485 asm volatile("kunpckbw %k7,%k6,%k5"); 1486 asm volatile("kunpckwd %k7,%k6,%k5"); 1487 asm volatile("kunpckdq %k7,%k6,%k5"); 1488 1489 asm volatile("kmovw %k6,%k5"); 1490 asm volatile("kmovw (%ecx),%k5"); 1491 asm volatile("kmovw 0x123(%eax,%ecx,8),%k5"); 1492 asm volatile("kmovw %k5,(%ecx)"); 1493 asm volatile("kmovw %k5,0x123(%eax,%ecx,8)"); 1494 asm 
volatile("kmovw %eax,%k5"); 1495 asm volatile("kmovw %ebp,%k5"); 1496 asm volatile("kmovw %k5,%eax"); 1497 asm volatile("kmovw %k5,%ebp"); 1498 1499 asm volatile("kmovq %k6,%k5"); 1500 asm volatile("kmovq (%ecx),%k5"); 1501 asm volatile("kmovq 0x123(%eax,%ecx,8),%k5"); 1502 asm volatile("kmovq %k5,(%ecx)"); 1503 asm volatile("kmovq %k5,0x123(%eax,%ecx,8)"); 1504 1505 asm volatile("kmovb %k6,%k5"); 1506 asm volatile("kmovb (%ecx),%k5"); 1507 asm volatile("kmovb 0x123(%eax,%ecx,8),%k5"); 1508 asm volatile("kmovb %k5,(%ecx)"); 1509 asm volatile("kmovb %k5,0x123(%eax,%ecx,8)"); 1510 asm volatile("kmovb %eax,%k5"); 1511 asm volatile("kmovb %ebp,%k5"); 1512 asm volatile("kmovb %k5,%eax"); 1513 asm volatile("kmovb %k5,%ebp"); 1514 1515 asm volatile("kmovd %k6,%k5"); 1516 asm volatile("kmovd (%ecx),%k5"); 1517 asm volatile("kmovd 0x123(%eax,%ecx,8),%k5"); 1518 asm volatile("kmovd %k5,(%ecx)"); 1519 asm volatile("kmovd %k5,0x123(%eax,%ecx,8)"); 1520 asm volatile("kmovd %eax,%k5"); 1521 asm volatile("kmovd %ebp,%k5"); 1522 asm volatile("kmovd %k5,%eax"); 1523 asm volatile("kmovd %k5,%ebp"); 1524 1525 asm volatile("kortestw %k6,%k5"); 1526 asm volatile("kortestq %k6,%k5"); 1527 asm volatile("kortestb %k6,%k5"); 1528 asm volatile("kortestd %k6,%k5"); 1529 1530 asm volatile("ktestw %k6,%k5"); 1531 asm volatile("ktestq %k6,%k5"); 1532 asm volatile("ktestb %k6,%k5"); 1533 asm volatile("ktestd %k6,%k5"); 1534 1535 asm volatile("kshiftrw $0x12,%k6,%k5"); 1536 asm volatile("kshiftrq $0x5b,%k6,%k5"); 1537 asm volatile("kshiftlw $0x12,%k6,%k5"); 1538 asm volatile("kshiftlq $0x5b,%k6,%k5"); 1539 1540 /* AVX-512: Op code 0f 5b */ 1541 asm volatile("vcvtdq2ps %xmm5,%xmm6"); 1542 asm volatile("vcvtqq2ps %zmm5,%ymm6{%k7}"); 1543 asm volatile("vcvtps2dq %xmm5,%xmm6"); 1544 asm volatile("vcvttps2dq %xmm5,%xmm6"); 1545 1546 /* AVX-512: Op code 0f 6f */ 1547 1548 asm volatile("movq %mm0,%mm4"); 1549 asm volatile("vmovdqa %ymm4,%ymm6"); 1550 asm volatile("vmovdqa32 %zmm5,%zmm6"); 1551 asm 
volatile("vmovdqa64 %zmm5,%zmm6"); 1552 asm volatile("vmovdqu %ymm4,%ymm6"); 1553 asm volatile("vmovdqu32 %zmm5,%zmm6"); 1554 asm volatile("vmovdqu64 %zmm5,%zmm6"); 1555 asm volatile("vmovdqu8 %zmm5,%zmm6"); 1556 asm volatile("vmovdqu16 %zmm5,%zmm6"); 1557 1558 /* AVX-512: Op code 0f 78 */ 1559 1560 asm volatile("vmread %eax,%ebx"); 1561 asm volatile("vcvttps2udq %zmm5,%zmm6"); 1562 asm volatile("vcvttpd2udq %zmm5,%ymm6{%k7}"); 1563 asm volatile("vcvttsd2usi %xmm6,%eax"); 1564 asm volatile("vcvttss2usi %xmm6,%eax"); 1565 asm volatile("vcvttps2uqq %ymm5,%zmm6{%k7}"); 1566 asm volatile("vcvttpd2uqq %zmm5,%zmm6"); 1567 1568 /* AVX-512: Op code 0f 79 */ 1569 1570 asm volatile("vmwrite %eax,%ebx"); 1571 asm volatile("vcvtps2udq %zmm5,%zmm6"); 1572 asm volatile("vcvtpd2udq %zmm5,%ymm6{%k7}"); 1573 asm volatile("vcvtsd2usi %xmm6,%eax"); 1574 asm volatile("vcvtss2usi %xmm6,%eax"); 1575 asm volatile("vcvtps2uqq %ymm5,%zmm6{%k7}"); 1576 asm volatile("vcvtpd2uqq %zmm5,%zmm6"); 1577 1578 /* AVX-512: Op code 0f 7a */ 1579 1580 asm volatile("vcvtudq2pd %ymm5,%zmm6{%k7}"); 1581 asm volatile("vcvtuqq2pd %zmm5,%zmm6"); 1582 asm volatile("vcvtudq2ps %zmm5,%zmm6"); 1583 asm volatile("vcvtuqq2ps %zmm5,%ymm6{%k7}"); 1584 asm volatile("vcvttps2qq %ymm5,%zmm6{%k7}"); 1585 asm volatile("vcvttpd2qq %zmm5,%zmm6"); 1586 1587 /* AVX-512: Op code 0f 7b */ 1588 1589 asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 1590 asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 1591 asm volatile("vcvtps2qq %ymm5,%zmm6{%k7}"); 1592 asm volatile("vcvtpd2qq %zmm5,%zmm6"); 1593 1594 /* AVX-512: Op code 0f 7f */ 1595 1596 asm volatile("movq.s %mm0,%mm4"); 1597 asm volatile("vmovdqa.s %ymm5,%ymm6"); 1598 asm volatile("vmovdqa32.s %zmm5,%zmm6"); 1599 asm volatile("vmovdqa64.s %zmm5,%zmm6"); 1600 asm volatile("vmovdqu.s %ymm5,%ymm6"); 1601 asm volatile("vmovdqu32.s %zmm5,%zmm6"); 1602 asm volatile("vmovdqu64.s %zmm5,%zmm6"); 1603 asm volatile("vmovdqu8.s %zmm5,%zmm6"); 1604 asm volatile("vmovdqu16.s %zmm5,%zmm6"); 1605 
1606 /* AVX-512: Op code 0f db */ 1607 1608 asm volatile("pand %mm1,%mm2"); 1609 asm volatile("pand %xmm1,%xmm2"); 1610 asm volatile("vpand %ymm4,%ymm6,%ymm2"); 1611 asm volatile("vpandd %zmm4,%zmm5,%zmm6"); 1612 asm volatile("vpandq %zmm4,%zmm5,%zmm6"); 1613 1614 /* AVX-512: Op code 0f df */ 1615 1616 asm volatile("pandn %mm1,%mm2"); 1617 asm volatile("pandn %xmm1,%xmm2"); 1618 asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 1619 asm volatile("vpandnd %zmm4,%zmm5,%zmm6"); 1620 asm volatile("vpandnq %zmm4,%zmm5,%zmm6"); 1621 1622 /* AVX-512: Op code 0f e6 */ 1623 1624 asm volatile("vcvttpd2dq %xmm1,%xmm2"); 1625 asm volatile("vcvtdq2pd %xmm5,%xmm6"); 1626 asm volatile("vcvtdq2pd %ymm5,%zmm6{%k7}"); 1627 asm volatile("vcvtqq2pd %zmm5,%zmm6"); 1628 asm volatile("vcvtpd2dq %xmm1,%xmm2"); 1629 1630 /* AVX-512: Op code 0f eb */ 1631 1632 asm volatile("por %mm4,%mm6"); 1633 asm volatile("vpor %ymm4,%ymm6,%ymm2"); 1634 asm volatile("vpord %zmm4,%zmm5,%zmm6"); 1635 asm volatile("vporq %zmm4,%zmm5,%zmm6"); 1636 1637 /* AVX-512: Op code 0f ef */ 1638 1639 asm volatile("pxor %mm4,%mm6"); 1640 asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 1641 asm volatile("vpxord %zmm4,%zmm5,%zmm6"); 1642 asm volatile("vpxorq %zmm4,%zmm5,%zmm6"); 1643 1644 /* AVX-512: Op code 0f 38 10 */ 1645 1646 asm volatile("pblendvb %xmm1,%xmm0"); 1647 asm volatile("vpsrlvw %zmm4,%zmm5,%zmm6"); 1648 asm volatile("vpmovuswb %zmm5,%ymm6{%k7}"); 1649 1650 /* AVX-512: Op code 0f 38 11 */ 1651 1652 asm volatile("vpmovusdb %zmm5,%xmm6{%k7}"); 1653 asm volatile("vpsravw %zmm4,%zmm5,%zmm6"); 1654 1655 /* AVX-512: Op code 0f 38 12 */ 1656 1657 asm volatile("vpmovusqb %zmm5,%xmm6{%k7}"); 1658 asm volatile("vpsllvw %zmm4,%zmm5,%zmm6"); 1659 1660 /* AVX-512: Op code 0f 38 13 */ 1661 1662 asm volatile("vcvtph2ps %xmm3,%ymm5"); 1663 asm volatile("vcvtph2ps %ymm5,%zmm6{%k7}"); 1664 asm volatile("vpmovusdw %zmm5,%ymm6{%k7}"); 1665 1666 /* AVX-512: Op code 0f 38 14 */ 1667 1668 asm volatile("blendvps %xmm1,%xmm0"); 1669 asm 
volatile("vpmovusqw %zmm5,%xmm6{%k7}"); 1670 asm volatile("vprorvd %zmm4,%zmm5,%zmm6"); 1671 asm volatile("vprorvq %zmm4,%zmm5,%zmm6"); 1672 1673 /* AVX-512: Op code 0f 38 15 */ 1674 1675 asm volatile("blendvpd %xmm1,%xmm0"); 1676 asm volatile("vpmovusqd %zmm5,%ymm6{%k7}"); 1677 asm volatile("vprolvd %zmm4,%zmm5,%zmm6"); 1678 asm volatile("vprolvq %zmm4,%zmm5,%zmm6"); 1679 1680 /* AVX-512: Op code 0f 38 16 */ 1681 1682 asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 1683 asm volatile("vpermps %ymm4,%ymm6,%ymm2{%k7}"); 1684 asm volatile("vpermpd %ymm4,%ymm6,%ymm2{%k7}"); 1685 1686 /* AVX-512: Op code 0f 38 19 */ 1687 1688 asm volatile("vbroadcastsd %xmm4,%ymm6"); 1689 asm volatile("vbroadcastf32x2 %xmm7,%zmm6"); 1690 1691 /* AVX-512: Op code 0f 38 1a */ 1692 1693 asm volatile("vbroadcastf128 (%ecx),%ymm4"); 1694 asm volatile("vbroadcastf32x4 (%ecx),%zmm6"); 1695 asm volatile("vbroadcastf64x2 (%ecx),%zmm6"); 1696 1697 /* AVX-512: Op code 0f 38 1b */ 1698 1699 asm volatile("vbroadcastf32x8 (%ecx),%zmm6"); 1700 asm volatile("vbroadcastf64x4 (%ecx),%zmm6"); 1701 1702 /* AVX-512: Op code 0f 38 1f */ 1703 1704 asm volatile("vpabsq %zmm4,%zmm6"); 1705 1706 /* AVX-512: Op code 0f 38 20 */ 1707 1708 asm volatile("vpmovsxbw %xmm4,%xmm5"); 1709 asm volatile("vpmovswb %zmm5,%ymm6{%k7}"); 1710 1711 /* AVX-512: Op code 0f 38 21 */ 1712 1713 asm volatile("vpmovsxbd %xmm4,%ymm6"); 1714 asm volatile("vpmovsdb %zmm5,%xmm6{%k7}"); 1715 1716 /* AVX-512: Op code 0f 38 22 */ 1717 1718 asm volatile("vpmovsxbq %xmm4,%ymm4"); 1719 asm volatile("vpmovsqb %zmm5,%xmm6{%k7}"); 1720 1721 /* AVX-512: Op code 0f 38 23 */ 1722 1723 asm volatile("vpmovsxwd %xmm4,%ymm4"); 1724 asm volatile("vpmovsdw %zmm5,%ymm6{%k7}"); 1725 1726 /* AVX-512: Op code 0f 38 24 */ 1727 1728 asm volatile("vpmovsxwq %xmm4,%ymm6"); 1729 asm volatile("vpmovsqw %zmm5,%xmm6{%k7}"); 1730 1731 /* AVX-512: Op code 0f 38 25 */ 1732 1733 asm volatile("vpmovsxdq %xmm4,%ymm4"); 1734 asm volatile("vpmovsqd %zmm5,%ymm6{%k7}"); 1735 1736 /* 
AVX-512: Op code 0f 38 26 */ 1737 1738 asm volatile("vptestmb %zmm5,%zmm6,%k5"); 1739 asm volatile("vptestmw %zmm5,%zmm6,%k5"); 1740 asm volatile("vptestnmb %zmm4,%zmm5,%k5"); 1741 asm volatile("vptestnmw %zmm4,%zmm5,%k5"); 1742 1743 /* AVX-512: Op code 0f 38 27 */ 1744 1745 asm volatile("vptestmd %zmm5,%zmm6,%k5"); 1746 asm volatile("vptestmq %zmm5,%zmm6,%k5"); 1747 asm volatile("vptestnmd %zmm4,%zmm5,%k5"); 1748 asm volatile("vptestnmq %zmm4,%zmm5,%k5"); 1749 1750 /* AVX-512: Op code 0f 38 28 */ 1751 1752 asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 1753 asm volatile("vpmovm2b %k5,%zmm6"); 1754 asm volatile("vpmovm2w %k5,%zmm6"); 1755 1756 /* AVX-512: Op code 0f 38 29 */ 1757 1758 asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 1759 asm volatile("vpmovb2m %zmm6,%k5"); 1760 asm volatile("vpmovw2m %zmm6,%k5"); 1761 1762 /* AVX-512: Op code 0f 38 2a */ 1763 1764 asm volatile("vmovntdqa (%ecx),%ymm4"); 1765 asm volatile("vpbroadcastmb2q %k6,%zmm1"); 1766 1767 /* AVX-512: Op code 0f 38 2c */ 1768 1769 asm volatile("vmaskmovps (%ecx),%ymm4,%ymm6"); 1770 asm volatile("vscalefps %zmm4,%zmm5,%zmm6"); 1771 asm volatile("vscalefpd %zmm4,%zmm5,%zmm6"); 1772 1773 /* AVX-512: Op code 0f 38 2d */ 1774 1775 asm volatile("vmaskmovpd (%ecx),%ymm4,%ymm6"); 1776 asm volatile("vscalefss %xmm4,%xmm5,%xmm6{%k7}"); 1777 asm volatile("vscalefsd %xmm4,%xmm5,%xmm6{%k7}"); 1778 1779 /* AVX-512: Op code 0f 38 30 */ 1780 1781 asm volatile("vpmovzxbw %xmm4,%ymm4"); 1782 asm volatile("vpmovwb %zmm5,%ymm6{%k7}"); 1783 1784 /* AVX-512: Op code 0f 38 31 */ 1785 1786 asm volatile("vpmovzxbd %xmm4,%ymm6"); 1787 asm volatile("vpmovdb %zmm5,%xmm6{%k7}"); 1788 1789 /* AVX-512: Op code 0f 38 32 */ 1790 1791 asm volatile("vpmovzxbq %xmm4,%ymm4"); 1792 asm volatile("vpmovqb %zmm5,%xmm6{%k7}"); 1793 1794 /* AVX-512: Op code 0f 38 33 */ 1795 1796 asm volatile("vpmovzxwd %xmm4,%ymm4"); 1797 asm volatile("vpmovdw %zmm5,%ymm6{%k7}"); 1798 1799 /* AVX-512: Op code 0f 38 34 */ 1800 1801 asm volatile("vpmovzxwq 
%xmm4,%ymm6"); 1802 asm volatile("vpmovqw %zmm5,%xmm6{%k7}"); 1803 1804 /* AVX-512: Op code 0f 38 35 */ 1805 1806 asm volatile("vpmovzxdq %xmm4,%ymm4"); 1807 asm volatile("vpmovqd %zmm5,%ymm6{%k7}"); 1808 1809 /* AVX-512: Op code 0f 38 36 */ 1810 1811 asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 1812 asm volatile("vpermd %ymm4,%ymm6,%ymm2{%k7}"); 1813 asm volatile("vpermq %ymm4,%ymm6,%ymm2{%k7}"); 1814 1815 /* AVX-512: Op code 0f 38 38 */ 1816 1817 asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 1818 asm volatile("vpmovm2d %k5,%zmm6"); 1819 asm volatile("vpmovm2q %k5,%zmm6"); 1820 1821 /* AVX-512: Op code 0f 38 39 */ 1822 1823 asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 1824 asm volatile("vpminsd %zmm4,%zmm5,%zmm6"); 1825 asm volatile("vpminsq %zmm4,%zmm5,%zmm6"); 1826 asm volatile("vpmovd2m %zmm6,%k5"); 1827 asm volatile("vpmovq2m %zmm6,%k5"); 1828 1829 /* AVX-512: Op code 0f 38 3a */ 1830 1831 asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 1832 asm volatile("vpbroadcastmw2d %k6,%zmm6"); 1833 1834 /* AVX-512: Op code 0f 38 3b */ 1835 1836 asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 1837 asm volatile("vpminud %zmm4,%zmm5,%zmm6"); 1838 asm volatile("vpminuq %zmm4,%zmm5,%zmm6"); 1839 1840 /* AVX-512: Op code 0f 38 3d */ 1841 1842 asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 1843 asm volatile("vpmaxsd %zmm4,%zmm5,%zmm6"); 1844 asm volatile("vpmaxsq %zmm4,%zmm5,%zmm6"); 1845 1846 /* AVX-512: Op code 0f 38 3f */ 1847 1848 asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 1849 asm volatile("vpmaxud %zmm4,%zmm5,%zmm6"); 1850 asm volatile("vpmaxuq %zmm4,%zmm5,%zmm6"); 1851 1852 /* AVX-512: Op code 0f 38 40 */ 1853 1854 asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 1855 asm volatile("vpmulld %zmm4,%zmm5,%zmm6"); 1856 asm volatile("vpmullq %zmm4,%zmm5,%zmm6"); 1857 1858 /* AVX-512: Op code 0f 38 42 */ 1859 1860 asm volatile("vgetexpps %zmm5,%zmm6"); 1861 asm volatile("vgetexppd %zmm5,%zmm6"); 1862 1863 /* AVX-512: Op code 0f 38 43 */ 1864 1865 asm volatile("vgetexpss %xmm4,%xmm5,%xmm6{%k7}"); 1866 
asm volatile("vgetexpsd %xmm2,%xmm3,%xmm4{%k7}"); 1867 1868 /* AVX-512: Op code 0f 38 44 */ 1869 1870 asm volatile("vplzcntd %zmm5,%zmm6"); 1871 asm volatile("vplzcntq %zmm5,%zmm6"); 1872 1873 /* AVX-512: Op code 0f 38 46 */ 1874 1875 asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 1876 asm volatile("vpsravd %zmm4,%zmm5,%zmm6"); 1877 asm volatile("vpsravq %zmm4,%zmm5,%zmm6"); 1878 1879 /* AVX-512: Op code 0f 38 4c */ 1880 1881 asm volatile("vrcp14ps %zmm5,%zmm6"); 1882 asm volatile("vrcp14pd %zmm5,%zmm6"); 1883 1884 /* AVX-512: Op code 0f 38 4d */ 1885 1886 asm volatile("vrcp14ss %xmm4,%xmm5,%xmm6{%k7}"); 1887 asm volatile("vrcp14sd %xmm4,%xmm5,%xmm6{%k7}"); 1888 1889 /* AVX-512: Op code 0f 38 4e */ 1890 1891 asm volatile("vrsqrt14ps %zmm5,%zmm6"); 1892 asm volatile("vrsqrt14pd %zmm5,%zmm6"); 1893 1894 /* AVX-512: Op code 0f 38 4f */ 1895 1896 asm volatile("vrsqrt14ss %xmm4,%xmm5,%xmm6{%k7}"); 1897 asm volatile("vrsqrt14sd %xmm4,%xmm5,%xmm6{%k7}"); 1898 1899 /* AVX-512: Op code 0f 38 59 */ 1900 1901 asm volatile("vpbroadcastq %xmm4,%xmm6"); 1902 asm volatile("vbroadcasti32x2 %xmm7,%zmm6"); 1903 1904 /* AVX-512: Op code 0f 38 5a */ 1905 1906 asm volatile("vbroadcasti128 (%ecx),%ymm4"); 1907 asm volatile("vbroadcasti32x4 (%ecx),%zmm6"); 1908 asm volatile("vbroadcasti64x2 (%ecx),%zmm6"); 1909 1910 /* AVX-512: Op code 0f 38 5b */ 1911 1912 asm volatile("vbroadcasti32x8 (%ecx),%zmm6"); 1913 asm volatile("vbroadcasti64x4 (%ecx),%zmm6"); 1914 1915 /* AVX-512: Op code 0f 38 64 */ 1916 1917 asm volatile("vpblendmd %zmm4,%zmm5,%zmm6"); 1918 asm volatile("vpblendmq %zmm4,%zmm5,%zmm6"); 1919 1920 /* AVX-512: Op code 0f 38 65 */ 1921 1922 asm volatile("vblendmps %zmm4,%zmm5,%zmm6"); 1923 asm volatile("vblendmpd %zmm4,%zmm5,%zmm6"); 1924 1925 /* AVX-512: Op code 0f 38 66 */ 1926 1927 asm volatile("vpblendmb %zmm4,%zmm5,%zmm6"); 1928 asm volatile("vpblendmw %zmm4,%zmm5,%zmm6"); 1929 1930 /* AVX-512: Op code 0f 38 75 */ 1931 1932 asm volatile("vpermi2b %zmm4,%zmm5,%zmm6"); 1933 asm 
volatile("vpermi2w %zmm4,%zmm5,%zmm6"); 1934 1935 /* AVX-512: Op code 0f 38 76 */ 1936 1937 asm volatile("vpermi2d %zmm4,%zmm5,%zmm6"); 1938 asm volatile("vpermi2q %zmm4,%zmm5,%zmm6"); 1939 1940 /* AVX-512: Op code 0f 38 77 */ 1941 1942 asm volatile("vpermi2ps %zmm4,%zmm5,%zmm6"); 1943 asm volatile("vpermi2pd %zmm4,%zmm5,%zmm6"); 1944 1945 /* AVX-512: Op code 0f 38 7a */ 1946 1947 asm volatile("vpbroadcastb %eax,%xmm3"); 1948 1949 /* AVX-512: Op code 0f 38 7b */ 1950 1951 asm volatile("vpbroadcastw %eax,%xmm3"); 1952 1953 /* AVX-512: Op code 0f 38 7c */ 1954 1955 asm volatile("vpbroadcastd %eax,%xmm3"); 1956 1957 /* AVX-512: Op code 0f 38 7d */ 1958 1959 asm volatile("vpermt2b %zmm4,%zmm5,%zmm6"); 1960 asm volatile("vpermt2w %zmm4,%zmm5,%zmm6"); 1961 1962 /* AVX-512: Op code 0f 38 7e */ 1963 1964 asm volatile("vpermt2d %zmm4,%zmm5,%zmm6"); 1965 asm volatile("vpermt2q %zmm4,%zmm5,%zmm6"); 1966 1967 /* AVX-512: Op code 0f 38 7f */ 1968 1969 asm volatile("vpermt2ps %zmm4,%zmm5,%zmm6"); 1970 asm volatile("vpermt2pd %zmm4,%zmm5,%zmm6"); 1971 1972 /* AVX-512: Op code 0f 38 83 */ 1973 1974 asm volatile("vpmultishiftqb %zmm4,%zmm5,%zmm6"); 1975 1976 /* AVX-512: Op code 0f 38 88 */ 1977 1978 asm volatile("vexpandps (%ecx),%zmm6"); 1979 asm volatile("vexpandpd (%ecx),%zmm6"); 1980 1981 /* AVX-512: Op code 0f 38 89 */ 1982 1983 asm volatile("vpexpandd (%ecx),%zmm6"); 1984 asm volatile("vpexpandq (%ecx),%zmm6"); 1985 1986 /* AVX-512: Op code 0f 38 8a */ 1987 1988 asm volatile("vcompressps %zmm6,(%ecx)"); 1989 asm volatile("vcompresspd %zmm6,(%ecx)"); 1990 1991 /* AVX-512: Op code 0f 38 8b */ 1992 1993 asm volatile("vpcompressd %zmm6,(%ecx)"); 1994 asm volatile("vpcompressq %zmm6,(%ecx)"); 1995 1996 /* AVX-512: Op code 0f 38 8d */ 1997 1998 asm volatile("vpermb %zmm4,%zmm5,%zmm6"); 1999 asm volatile("vpermw %zmm4,%zmm5,%zmm6"); 2000 2001 /* AVX-512: Op code 0f 38 90 */ 2002 2003 asm volatile("vpgatherdd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2004 asm volatile("vpgatherdq 
%xmm2,0x04(%ebp,%xmm7,2),%xmm1"); 2005 asm volatile("vpgatherdd 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 2006 asm volatile("vpgatherdq 0x7b(%ebp,%ymm7,8),%zmm6{%k1}"); 2007 2008 /* AVX-512: Op code 0f 38 91 */ 2009 2010 asm volatile("vpgatherqd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2011 asm volatile("vpgatherqq %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 2012 asm volatile("vpgatherqd 0x7b(%ebp,%zmm7,8),%ymm6{%k1}"); 2013 asm volatile("vpgatherqq 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 2014 2015 /* AVX-512: Op code 0f 38 a0 */ 2016 2017 asm volatile("vpscatterdd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2018 asm volatile("vpscatterdq %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 2019 2020 /* AVX-512: Op code 0f 38 a1 */ 2021 2022 asm volatile("vpscatterqd %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2023 asm volatile("vpscatterqq %ymm6,0x7b(%ebp,%ymm7,8){%k1}"); 2024 2025 /* AVX-512: Op code 0f 38 a2 */ 2026 2027 asm volatile("vscatterdps %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2028 asm volatile("vscatterdpd %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 2029 2030 /* AVX-512: Op code 0f 38 a3 */ 2031 2032 asm volatile("vscatterqps %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 2033 asm volatile("vscatterqpd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 2034 2035 /* AVX-512: Op code 0f 38 b4 */ 2036 2037 asm volatile("vpmadd52luq %zmm4,%zmm5,%zmm6"); 2038 2039 /* AVX-512: Op code 0f 38 b5 */ 2040 2041 asm volatile("vpmadd52huq %zmm4,%zmm5,%zmm6"); 2042 2043 /* AVX-512: Op code 0f 38 c4 */ 2044 2045 asm volatile("vpconflictd %zmm5,%zmm6"); 2046 asm volatile("vpconflictq %zmm5,%zmm6"); 2047 2048 /* AVX-512: Op code 0f 38 c8 */ 2049 2050 asm volatile("vexp2ps %zmm6,%zmm7"); 2051 asm volatile("vexp2pd %zmm6,%zmm7"); 2052 2053 /* AVX-512: Op code 0f 38 ca */ 2054 2055 asm volatile("vrcp28ps %zmm6,%zmm7"); 2056 asm volatile("vrcp28pd %zmm6,%zmm7"); 2057 2058 /* AVX-512: Op code 0f 38 cb */ 2059 2060 asm volatile("vrcp28ss %xmm5,%xmm6,%xmm7{%k7}"); 2061 asm volatile("vrcp28sd %xmm5,%xmm6,%xmm7{%k7}"); 2062 2063 /* AVX-512: Op code 0f 38 cc */ 2064 2065 asm volatile("vrsqrt28ps 
%zmm6,%zmm7"); 2066 asm volatile("vrsqrt28pd %zmm6,%zmm7"); 2067 2068 /* AVX-512: Op code 0f 38 cd */ 2069 2070 asm volatile("vrsqrt28ss %xmm5,%xmm6,%xmm7{%k7}"); 2071 asm volatile("vrsqrt28sd %xmm5,%xmm6,%xmm7{%k7}"); 2072 2073 /* AVX-512: Op code 0f 3a 03 */ 2074 2075 asm volatile("valignd $0x12,%zmm5,%zmm6,%zmm7"); 2076 asm volatile("valignq $0x12,%zmm5,%zmm6,%zmm7"); 2077 2078 /* AVX-512: Op code 0f 3a 08 */ 2079 2080 asm volatile("vroundps $0x5,%ymm6,%ymm2"); 2081 asm volatile("vrndscaleps $0x12,%zmm5,%zmm6"); 2082 2083 /* AVX-512: Op code 0f 3a 09 */ 2084 2085 asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 2086 asm volatile("vrndscalepd $0x12,%zmm5,%zmm6"); 2087 2088 /* AVX-512: Op code 0f 3a 0a */ 2089 2090 asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 2091 asm volatile("vrndscaless $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2092 2093 /* AVX-512: Op code 0f 3a 0b */ 2094 2095 asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 2096 asm volatile("vrndscalesd $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 2097 2098 /* AVX-512: Op code 0f 3a 18 */ 2099 2100 asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 2101 asm volatile("vinsertf32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2102 asm volatile("vinsertf64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2103 2104 /* AVX-512: Op code 0f 3a 19 */ 2105 2106 asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 2107 asm volatile("vextractf32x4 $0x12,%zmm5,%xmm6{%k7}"); 2108 asm volatile("vextractf64x2 $0x12,%zmm5,%xmm6{%k7}"); 2109 2110 /* AVX-512: Op code 0f 3a 1a */ 2111 2112 asm volatile("vinsertf32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2113 asm volatile("vinsertf64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2114 2115 /* AVX-512: Op code 0f 3a 1b */ 2116 2117 asm volatile("vextractf32x8 $0x12,%zmm6,%ymm7{%k7}"); 2118 asm volatile("vextractf64x4 $0x12,%zmm6,%ymm7{%k7}"); 2119 2120 /* AVX-512: Op code 0f 3a 1e */ 2121 2122 asm volatile("vpcmpud $0x12,%zmm6,%zmm7,%k5"); 2123 asm volatile("vpcmpuq $0x12,%zmm6,%zmm7,%k5"); 2124 2125 /* AVX-512: Op code 0f 3a 1f */ 2126 2127 asm 
volatile("vpcmpd $0x12,%zmm6,%zmm7,%k5"); 2128 asm volatile("vpcmpq $0x12,%zmm6,%zmm7,%k5"); 2129 2130 /* AVX-512: Op code 0f 3a 23 */ 2131 2132 asm volatile("vshuff32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2133 asm volatile("vshuff64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2134 2135 /* AVX-512: Op code 0f 3a 25 */ 2136 2137 asm volatile("vpternlogd $0x12,%zmm5,%zmm6,%zmm7"); 2138 asm volatile("vpternlogq $0x12,%zmm5,%zmm6,%zmm7"); 2139 2140 /* AVX-512: Op code 0f 3a 26 */ 2141 2142 asm volatile("vgetmantps $0x12,%zmm6,%zmm7"); 2143 asm volatile("vgetmantpd $0x12,%zmm6,%zmm7"); 2144 2145 /* AVX-512: Op code 0f 3a 27 */ 2146 2147 asm volatile("vgetmantss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2148 asm volatile("vgetmantsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2149 2150 /* AVX-512: Op code 0f 3a 38 */ 2151 2152 asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 2153 asm volatile("vinserti32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2154 asm volatile("vinserti64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 2155 2156 /* AVX-512: Op code 0f 3a 39 */ 2157 2158 asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 2159 asm volatile("vextracti32x4 $0x12,%zmm5,%xmm6{%k7}"); 2160 asm volatile("vextracti64x2 $0x12,%zmm5,%xmm6{%k7}"); 2161 2162 /* AVX-512: Op code 0f 3a 3a */ 2163 2164 asm volatile("vinserti32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2165 asm volatile("vinserti64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 2166 2167 /* AVX-512: Op code 0f 3a 3b */ 2168 2169 asm volatile("vextracti32x8 $0x12,%zmm6,%ymm7{%k7}"); 2170 asm volatile("vextracti64x4 $0x12,%zmm6,%ymm7{%k7}"); 2171 2172 /* AVX-512: Op code 0f 3a 3e */ 2173 2174 asm volatile("vpcmpub $0x12,%zmm6,%zmm7,%k5"); 2175 asm volatile("vpcmpuw $0x12,%zmm6,%zmm7,%k5"); 2176 2177 /* AVX-512: Op code 0f 3a 3f */ 2178 2179 asm volatile("vpcmpb $0x12,%zmm6,%zmm7,%k5"); 2180 asm volatile("vpcmpw $0x12,%zmm6,%zmm7,%k5"); 2181 2182 /* AVX-512: Op code 0f 3a 42 */ 2183 2184 asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 2185 asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 2186 2187 /* 
AVX-512: Op code 0f 3a 43 */ 2188 2189 asm volatile("vshufi32x4 $0x12,%zmm5,%zmm6,%zmm7"); 2190 asm volatile("vshufi64x2 $0x12,%zmm5,%zmm6,%zmm7"); 2191 2192 /* AVX-512: Op code 0f 3a 50 */ 2193 2194 asm volatile("vrangeps $0x12,%zmm5,%zmm6,%zmm7"); 2195 asm volatile("vrangepd $0x12,%zmm5,%zmm6,%zmm7"); 2196 2197 /* AVX-512: Op code 0f 3a 51 */ 2198 2199 asm volatile("vrangess $0x12,%xmm5,%xmm6,%xmm7"); 2200 asm volatile("vrangesd $0x12,%xmm5,%xmm6,%xmm7"); 2201 2202 /* AVX-512: Op code 0f 3a 54 */ 2203 2204 asm volatile("vfixupimmps $0x12,%zmm5,%zmm6,%zmm7"); 2205 asm volatile("vfixupimmpd $0x12,%zmm5,%zmm6,%zmm7"); 2206 2207 /* AVX-512: Op code 0f 3a 55 */ 2208 2209 asm volatile("vfixupimmss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2210 asm volatile("vfixupimmsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 2211 2212 /* AVX-512: Op code 0f 3a 56 */ 2213 2214 asm volatile("vreduceps $0x12,%zmm6,%zmm7"); 2215 asm volatile("vreducepd $0x12,%zmm6,%zmm7"); 2216 2217 /* AVX-512: Op code 0f 3a 57 */ 2218 2219 asm volatile("vreducess $0x12,%xmm5,%xmm6,%xmm7"); 2220 asm volatile("vreducesd $0x12,%xmm5,%xmm6,%xmm7"); 2221 2222 /* AVX-512: Op code 0f 3a 66 */ 2223 2224 asm volatile("vfpclassps $0x12,%zmm7,%k5"); 2225 asm volatile("vfpclasspd $0x12,%zmm7,%k5"); 2226 2227 /* AVX-512: Op code 0f 3a 67 */ 2228 2229 asm volatile("vfpclassss $0x12,%xmm7,%k5"); 2230 asm volatile("vfpclasssd $0x12,%xmm7,%k5"); 2231 2232 /* AVX-512: Op code 0f 72 (Grp13) */ 2233 2234 asm volatile("vprord $0x12,%zmm5,%zmm6"); 2235 asm volatile("vprorq $0x12,%zmm5,%zmm6"); 2236 asm volatile("vprold $0x12,%zmm5,%zmm6"); 2237 asm volatile("vprolq $0x12,%zmm5,%zmm6"); 2238 asm volatile("psrad $0x2,%mm6"); 2239 asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 2240 asm volatile("vpsrad $0x5,%zmm6,%zmm2"); 2241 asm volatile("vpsraq $0x5,%zmm6,%zmm2"); 2242 2243 /* AVX-512: Op code 0f 38 c6 (Grp18) */ 2244 2245 asm volatile("vgatherpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2246 asm volatile("vgatherpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2247 asm 
volatile("vgatherpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2248 asm volatile("vgatherpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2249 asm volatile("vscatterpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 2250 asm volatile("vscatterpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2251 asm volatile("vscatterpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 2252 asm volatile("vscatterpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 2253 2254 /* AVX-512: Op code 0f 38 c7 (Grp19) */ 2255 2256 asm volatile("vgatherpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2257 asm volatile("vgatherpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2258 asm volatile("vgatherpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2259 asm volatile("vgatherpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2260 asm volatile("vscatterpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 2261 asm volatile("vscatterpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2262 asm volatile("vscatterpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 2263 asm volatile("vscatterpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 2264 2265 /* AVX-512: Examples */ 2266 2267 asm volatile("vaddpd %zmm4,%zmm5,%zmm6"); 2268 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}"); 2269 asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}{z}"); 2270 asm volatile("vaddpd {rn-sae},%zmm4,%zmm5,%zmm6"); 2271 asm volatile("vaddpd {ru-sae},%zmm4,%zmm5,%zmm6"); 2272 asm volatile("vaddpd {rd-sae},%zmm4,%zmm5,%zmm6"); 2273 asm volatile("vaddpd {rz-sae},%zmm4,%zmm5,%zmm6"); 2274 asm volatile("vaddpd (%ecx),%zmm5,%zmm6"); 2275 asm volatile("vaddpd 0x123(%eax,%ecx,8),%zmm5,%zmm6"); 2276 asm volatile("vaddpd (%ecx){1to8},%zmm5,%zmm6"); 2277 asm volatile("vaddpd 0x1fc0(%edx),%zmm5,%zmm6"); 2278 asm volatile("vaddpd 0x3f8(%edx){1to8},%zmm5,%zmm6"); 2279 asm volatile("vcmpeq_uqps 0x1fc(%edx){1to16},%zmm6,%k5"); 2280 asm volatile("vcmpltsd 0x123(%eax,%ecx,8),%xmm3,%k5{%k7}"); 2281 asm volatile("vcmplesd {sae},%xmm4,%xmm5,%k5{%k7}"); 2282 asm volatile("vgetmantss $0x5b,0x123(%eax,%ecx,8),%xmm4,%xmm5{%k7}"); 2283 2284 /* bndmk m32, bnd */ 2285 2286 asm volatile("bndmk (%eax), %bnd0"); 2287 asm volatile("bndmk (0x12345678), %bnd0"); 2288 asm volatile("bndmk 
(%eax), %bnd3"); 2289 asm volatile("bndmk (%ecx,%eax,1), %bnd0"); 2290 asm volatile("bndmk 0x12345678(,%eax,1), %bnd0"); 2291 asm volatile("bndmk (%eax,%ecx,1), %bnd0"); 2292 asm volatile("bndmk (%eax,%ecx,8), %bnd0"); 2293 asm volatile("bndmk 0x12(%eax), %bnd0"); 2294 asm volatile("bndmk 0x12(%ebp), %bnd0"); 2295 asm volatile("bndmk 0x12(%ecx,%eax,1), %bnd0"); 2296 asm volatile("bndmk 0x12(%ebp,%eax,1), %bnd0"); 2297 asm volatile("bndmk 0x12(%eax,%ecx,1), %bnd0"); 2298 asm volatile("bndmk 0x12(%eax,%ecx,8), %bnd0"); 2299 asm volatile("bndmk 0x12345678(%eax), %bnd0"); 2300 asm volatile("bndmk 0x12345678(%ebp), %bnd0"); 2301 asm volatile("bndmk 0x12345678(%ecx,%eax,1), %bnd0"); 2302 asm volatile("bndmk 0x12345678(%ebp,%eax,1), %bnd0"); 2303 asm volatile("bndmk 0x12345678(%eax,%ecx,1), %bnd0"); 2304 asm volatile("bndmk 0x12345678(%eax,%ecx,8), %bnd0"); 2305 2306 /* bndcl r/m32, bnd */ 2307 2308 asm volatile("bndcl (%eax), %bnd0"); 2309 asm volatile("bndcl (0x12345678), %bnd0"); 2310 asm volatile("bndcl (%eax), %bnd3"); 2311 asm volatile("bndcl (%ecx,%eax,1), %bnd0"); 2312 asm volatile("bndcl 0x12345678(,%eax,1), %bnd0"); 2313 asm volatile("bndcl (%eax,%ecx,1), %bnd0"); 2314 asm volatile("bndcl (%eax,%ecx,8), %bnd0"); 2315 asm volatile("bndcl 0x12(%eax), %bnd0"); 2316 asm volatile("bndcl 0x12(%ebp), %bnd0"); 2317 asm volatile("bndcl 0x12(%ecx,%eax,1), %bnd0"); 2318 asm volatile("bndcl 0x12(%ebp,%eax,1), %bnd0"); 2319 asm volatile("bndcl 0x12(%eax,%ecx,1), %bnd0"); 2320 asm volatile("bndcl 0x12(%eax,%ecx,8), %bnd0"); 2321 asm volatile("bndcl 0x12345678(%eax), %bnd0"); 2322 asm volatile("bndcl 0x12345678(%ebp), %bnd0"); 2323 asm volatile("bndcl 0x12345678(%ecx,%eax,1), %bnd0"); 2324 asm volatile("bndcl 0x12345678(%ebp,%eax,1), %bnd0"); 2325 asm volatile("bndcl 0x12345678(%eax,%ecx,1), %bnd0"); 2326 asm volatile("bndcl 0x12345678(%eax,%ecx,8), %bnd0"); 2327 asm volatile("bndcl %eax, %bnd0"); 2328 2329 /* bndcu r/m32, bnd */ 2330 2331 asm volatile("bndcu (%eax), %bnd0"); 
2332 asm volatile("bndcu (0x12345678), %bnd0"); 2333 asm volatile("bndcu (%eax), %bnd3"); 2334 asm volatile("bndcu (%ecx,%eax,1), %bnd0"); 2335 asm volatile("bndcu 0x12345678(,%eax,1), %bnd0"); 2336 asm volatile("bndcu (%eax,%ecx,1), %bnd0"); 2337 asm volatile("bndcu (%eax,%ecx,8), %bnd0"); 2338 asm volatile("bndcu 0x12(%eax), %bnd0"); 2339 asm volatile("bndcu 0x12(%ebp), %bnd0"); 2340 asm volatile("bndcu 0x12(%ecx,%eax,1), %bnd0"); 2341 asm volatile("bndcu 0x12(%ebp,%eax,1), %bnd0"); 2342 asm volatile("bndcu 0x12(%eax,%ecx,1), %bnd0"); 2343 asm volatile("bndcu 0x12(%eax,%ecx,8), %bnd0"); 2344 asm volatile("bndcu 0x12345678(%eax), %bnd0"); 2345 asm volatile("bndcu 0x12345678(%ebp), %bnd0"); 2346 asm volatile("bndcu 0x12345678(%ecx,%eax,1), %bnd0"); 2347 asm volatile("bndcu 0x12345678(%ebp,%eax,1), %bnd0"); 2348 asm volatile("bndcu 0x12345678(%eax,%ecx,1), %bnd0"); 2349 asm volatile("bndcu 0x12345678(%eax,%ecx,8), %bnd0"); 2350 asm volatile("bndcu %eax, %bnd0"); 2351 2352 /* bndcn r/m32, bnd */ 2353 2354 asm volatile("bndcn (%eax), %bnd0"); 2355 asm volatile("bndcn (0x12345678), %bnd0"); 2356 asm volatile("bndcn (%eax), %bnd3"); 2357 asm volatile("bndcn (%ecx,%eax,1), %bnd0"); 2358 asm volatile("bndcn 0x12345678(,%eax,1), %bnd0"); 2359 asm volatile("bndcn (%eax,%ecx,1), %bnd0"); 2360 asm volatile("bndcn (%eax,%ecx,8), %bnd0"); 2361 asm volatile("bndcn 0x12(%eax), %bnd0"); 2362 asm volatile("bndcn 0x12(%ebp), %bnd0"); 2363 asm volatile("bndcn 0x12(%ecx,%eax,1), %bnd0"); 2364 asm volatile("bndcn 0x12(%ebp,%eax,1), %bnd0"); 2365 asm volatile("bndcn 0x12(%eax,%ecx,1), %bnd0"); 2366 asm volatile("bndcn 0x12(%eax,%ecx,8), %bnd0"); 2367 asm volatile("bndcn 0x12345678(%eax), %bnd0"); 2368 asm volatile("bndcn 0x12345678(%ebp), %bnd0"); 2369 asm volatile("bndcn 0x12345678(%ecx,%eax,1), %bnd0"); 2370 asm volatile("bndcn 0x12345678(%ebp,%eax,1), %bnd0"); 2371 asm volatile("bndcn 0x12345678(%eax,%ecx,1), %bnd0"); 2372 asm volatile("bndcn 0x12345678(%eax,%ecx,8), %bnd0"); 2373 
asm volatile("bndcn %eax, %bnd0"); 2374 2375 /* bndmov m64, bnd */ 2376 2377 asm volatile("bndmov (%eax), %bnd0"); 2378 asm volatile("bndmov (0x12345678), %bnd0"); 2379 asm volatile("bndmov (%eax), %bnd3"); 2380 asm volatile("bndmov (%ecx,%eax,1), %bnd0"); 2381 asm volatile("bndmov 0x12345678(,%eax,1), %bnd0"); 2382 asm volatile("bndmov (%eax,%ecx,1), %bnd0"); 2383 asm volatile("bndmov (%eax,%ecx,8), %bnd0"); 2384 asm volatile("bndmov 0x12(%eax), %bnd0"); 2385 asm volatile("bndmov 0x12(%ebp), %bnd0"); 2386 asm volatile("bndmov 0x12(%ecx,%eax,1), %bnd0"); 2387 asm volatile("bndmov 0x12(%ebp,%eax,1), %bnd0"); 2388 asm volatile("bndmov 0x12(%eax,%ecx,1), %bnd0"); 2389 asm volatile("bndmov 0x12(%eax,%ecx,8), %bnd0"); 2390 asm volatile("bndmov 0x12345678(%eax), %bnd0"); 2391 asm volatile("bndmov 0x12345678(%ebp), %bnd0"); 2392 asm volatile("bndmov 0x12345678(%ecx,%eax,1), %bnd0"); 2393 asm volatile("bndmov 0x12345678(%ebp,%eax,1), %bnd0"); 2394 asm volatile("bndmov 0x12345678(%eax,%ecx,1), %bnd0"); 2395 asm volatile("bndmov 0x12345678(%eax,%ecx,8), %bnd0"); 2396 2397 /* bndmov bnd, m64 */ 2398 2399 asm volatile("bndmov %bnd0, (%eax)"); 2400 asm volatile("bndmov %bnd0, (0x12345678)"); 2401 asm volatile("bndmov %bnd3, (%eax)"); 2402 asm volatile("bndmov %bnd0, (%ecx,%eax,1)"); 2403 asm volatile("bndmov %bnd0, 0x12345678(,%eax,1)"); 2404 asm volatile("bndmov %bnd0, (%eax,%ecx,1)"); 2405 asm volatile("bndmov %bnd0, (%eax,%ecx,8)"); 2406 asm volatile("bndmov %bnd0, 0x12(%eax)"); 2407 asm volatile("bndmov %bnd0, 0x12(%ebp)"); 2408 asm volatile("bndmov %bnd0, 0x12(%ecx,%eax,1)"); 2409 asm volatile("bndmov %bnd0, 0x12(%ebp,%eax,1)"); 2410 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,1)"); 2411 asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,8)"); 2412 asm volatile("bndmov %bnd0, 0x12345678(%eax)"); 2413 asm volatile("bndmov %bnd0, 0x12345678(%ebp)"); 2414 asm volatile("bndmov %bnd0, 0x12345678(%ecx,%eax,1)"); 2415 asm volatile("bndmov %bnd0, 0x12345678(%ebp,%eax,1)"); 2416 asm 
volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,1)"); 2417 asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,8)"); 2418 2419 /* bndmov bnd2, bnd1 */ 2420 2421 asm volatile("bndmov %bnd0, %bnd1"); 2422 asm volatile("bndmov %bnd1, %bnd0"); 2423 2424 /* bndldx mib, bnd */ 2425 2426 asm volatile("bndldx (%eax), %bnd0"); 2427 asm volatile("bndldx (0x12345678), %bnd0"); 2428 asm volatile("bndldx (%eax), %bnd3"); 2429 asm volatile("bndldx (%ecx,%eax,1), %bnd0"); 2430 asm volatile("bndldx 0x12345678(,%eax,1), %bnd0"); 2431 asm volatile("bndldx (%eax,%ecx,1), %bnd0"); 2432 asm volatile("bndldx 0x12(%eax), %bnd0"); 2433 asm volatile("bndldx 0x12(%ebp), %bnd0"); 2434 asm volatile("bndldx 0x12(%ecx,%eax,1), %bnd0"); 2435 asm volatile("bndldx 0x12(%ebp,%eax,1), %bnd0"); 2436 asm volatile("bndldx 0x12(%eax,%ecx,1), %bnd0"); 2437 asm volatile("bndldx 0x12345678(%eax), %bnd0"); 2438 asm volatile("bndldx 0x12345678(%ebp), %bnd0"); 2439 asm volatile("bndldx 0x12345678(%ecx,%eax,1), %bnd0"); 2440 asm volatile("bndldx 0x12345678(%ebp,%eax,1), %bnd0"); 2441 asm volatile("bndldx 0x12345678(%eax,%ecx,1), %bnd0"); 2442 2443 /* bndstx bnd, mib */ 2444 2445 asm volatile("bndstx %bnd0, (%eax)"); 2446 asm volatile("bndstx %bnd0, (0x12345678)"); 2447 asm volatile("bndstx %bnd3, (%eax)"); 2448 asm volatile("bndstx %bnd0, (%ecx,%eax,1)"); 2449 asm volatile("bndstx %bnd0, 0x12345678(,%eax,1)"); 2450 asm volatile("bndstx %bnd0, (%eax,%ecx,1)"); 2451 asm volatile("bndstx %bnd0, 0x12(%eax)"); 2452 asm volatile("bndstx %bnd0, 0x12(%ebp)"); 2453 asm volatile("bndstx %bnd0, 0x12(%ecx,%eax,1)"); 2454 asm volatile("bndstx %bnd0, 0x12(%ebp,%eax,1)"); 2455 asm volatile("bndstx %bnd0, 0x12(%eax,%ecx,1)"); 2456 asm volatile("bndstx %bnd0, 0x12345678(%eax)"); 2457 asm volatile("bndstx %bnd0, 0x12345678(%ebp)"); 2458 asm volatile("bndstx %bnd0, 0x12345678(%ecx,%eax,1)"); 2459 asm volatile("bndstx %bnd0, 0x12345678(%ebp,%eax,1)"); 2460 asm volatile("bndstx %bnd0, 0x12345678(%eax,%ecx,1)"); 2461 2462 /* bnd prefix 
on call, ret, jmp and all jcc */ 2463 2464 asm volatile("bnd call label1"); /* Expecting: call unconditional 0xfffffffc */ 2465 asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 2466 asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 2467 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 2468 asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 2469 asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 2470 asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0xfffffffc */ 2471 2472 /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 2473 2474 asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 2475 asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 2476 asm volatile("sha1rnds4 $0x91, (%eax), %xmm0"); 2477 asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 2478 asm volatile("sha1rnds4 $0x91, (%eax), %xmm3"); 2479 asm volatile("sha1rnds4 $0x91, (%ecx,%eax,1), %xmm0"); 2480 asm volatile("sha1rnds4 $0x91, 0x12345678(,%eax,1), %xmm0"); 2481 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,1), %xmm0"); 2482 asm volatile("sha1rnds4 $0x91, (%eax,%ecx,8), %xmm0"); 2483 asm volatile("sha1rnds4 $0x91, 0x12(%eax), %xmm0"); 2484 asm volatile("sha1rnds4 $0x91, 0x12(%ebp), %xmm0"); 2485 asm volatile("sha1rnds4 $0x91, 0x12(%ecx,%eax,1), %xmm0"); 2486 asm volatile("sha1rnds4 $0x91, 0x12(%ebp,%eax,1), %xmm0"); 2487 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,1), %xmm0"); 2488 asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,8), %xmm0"); 2489 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax), %xmm0"); 2490 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp), %xmm0"); 2491 asm volatile("sha1rnds4 $0x91, 0x12345678(%ecx,%eax,1), %xmm0"); 2492 asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp,%eax,1), %xmm0"); 2493 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,1), %xmm0"); 2494 asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,8), %xmm0"); 2495 2496 /* sha1nexte xmm2/m128, xmm1 */ 2497 2498 asm volatile("sha1nexte %xmm1, 
%xmm0"); 2499 asm volatile("sha1nexte %xmm7, %xmm2"); 2500 asm volatile("sha1nexte (%eax), %xmm0"); 2501 asm volatile("sha1nexte (0x12345678), %xmm0"); 2502 asm volatile("sha1nexte (%eax), %xmm3"); 2503 asm volatile("sha1nexte (%ecx,%eax,1), %xmm0"); 2504 asm volatile("sha1nexte 0x12345678(,%eax,1), %xmm0"); 2505 asm volatile("sha1nexte (%eax,%ecx,1), %xmm0"); 2506 asm volatile("sha1nexte (%eax,%ecx,8), %xmm0"); 2507 asm volatile("sha1nexte 0x12(%eax), %xmm0"); 2508 asm volatile("sha1nexte 0x12(%ebp), %xmm0"); 2509 asm volatile("sha1nexte 0x12(%ecx,%eax,1), %xmm0"); 2510 asm volatile("sha1nexte 0x12(%ebp,%eax,1), %xmm0"); 2511 asm volatile("sha1nexte 0x12(%eax,%ecx,1), %xmm0"); 2512 asm volatile("sha1nexte 0x12(%eax,%ecx,8), %xmm0"); 2513 asm volatile("sha1nexte 0x12345678(%eax), %xmm0"); 2514 asm volatile("sha1nexte 0x12345678(%ebp), %xmm0"); 2515 asm volatile("sha1nexte 0x12345678(%ecx,%eax,1), %xmm0"); 2516 asm volatile("sha1nexte 0x12345678(%ebp,%eax,1), %xmm0"); 2517 asm volatile("sha1nexte 0x12345678(%eax,%ecx,1), %xmm0"); 2518 asm volatile("sha1nexte 0x12345678(%eax,%ecx,8), %xmm0"); 2519 2520 /* sha1msg1 xmm2/m128, xmm1 */ 2521 2522 asm volatile("sha1msg1 %xmm1, %xmm0"); 2523 asm volatile("sha1msg1 %xmm7, %xmm2"); 2524 asm volatile("sha1msg1 (%eax), %xmm0"); 2525 asm volatile("sha1msg1 (0x12345678), %xmm0"); 2526 asm volatile("sha1msg1 (%eax), %xmm3"); 2527 asm volatile("sha1msg1 (%ecx,%eax,1), %xmm0"); 2528 asm volatile("sha1msg1 0x12345678(,%eax,1), %xmm0"); 2529 asm volatile("sha1msg1 (%eax,%ecx,1), %xmm0"); 2530 asm volatile("sha1msg1 (%eax,%ecx,8), %xmm0"); 2531 asm volatile("sha1msg1 0x12(%eax), %xmm0"); 2532 asm volatile("sha1msg1 0x12(%ebp), %xmm0"); 2533 asm volatile("sha1msg1 0x12(%ecx,%eax,1), %xmm0"); 2534 asm volatile("sha1msg1 0x12(%ebp,%eax,1), %xmm0"); 2535 asm volatile("sha1msg1 0x12(%eax,%ecx,1), %xmm0"); 2536 asm volatile("sha1msg1 0x12(%eax,%ecx,8), %xmm0"); 2537 asm volatile("sha1msg1 0x12345678(%eax), %xmm0"); 2538 asm 
volatile("sha1msg1 0x12345678(%ebp), %xmm0"); 2539 asm volatile("sha1msg1 0x12345678(%ecx,%eax,1), %xmm0"); 2540 asm volatile("sha1msg1 0x12345678(%ebp,%eax,1), %xmm0"); 2541 asm volatile("sha1msg1 0x12345678(%eax,%ecx,1), %xmm0"); 2542 asm volatile("sha1msg1 0x12345678(%eax,%ecx,8), %xmm0"); 2543 2544 /* sha1msg2 xmm2/m128, xmm1 */ 2545 2546 asm volatile("sha1msg2 %xmm1, %xmm0"); 2547 asm volatile("sha1msg2 %xmm7, %xmm2"); 2548 asm volatile("sha1msg2 (%eax), %xmm0"); 2549 asm volatile("sha1msg2 (0x12345678), %xmm0"); 2550 asm volatile("sha1msg2 (%eax), %xmm3"); 2551 asm volatile("sha1msg2 (%ecx,%eax,1), %xmm0"); 2552 asm volatile("sha1msg2 0x12345678(,%eax,1), %xmm0"); 2553 asm volatile("sha1msg2 (%eax,%ecx,1), %xmm0"); 2554 asm volatile("sha1msg2 (%eax,%ecx,8), %xmm0"); 2555 asm volatile("sha1msg2 0x12(%eax), %xmm0"); 2556 asm volatile("sha1msg2 0x12(%ebp), %xmm0"); 2557 asm volatile("sha1msg2 0x12(%ecx,%eax,1), %xmm0"); 2558 asm volatile("sha1msg2 0x12(%ebp,%eax,1), %xmm0"); 2559 asm volatile("sha1msg2 0x12(%eax,%ecx,1), %xmm0"); 2560 asm volatile("sha1msg2 0x12(%eax,%ecx,8), %xmm0"); 2561 asm volatile("sha1msg2 0x12345678(%eax), %xmm0"); 2562 asm volatile("sha1msg2 0x12345678(%ebp), %xmm0"); 2563 asm volatile("sha1msg2 0x12345678(%ecx,%eax,1), %xmm0"); 2564 asm volatile("sha1msg2 0x12345678(%ebp,%eax,1), %xmm0"); 2565 asm volatile("sha1msg2 0x12345678(%eax,%ecx,1), %xmm0"); 2566 asm volatile("sha1msg2 0x12345678(%eax,%ecx,8), %xmm0"); 2567 2568 /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 2569 /* Note sha256rnds2 has an implicit operand 'xmm0' */ 2570 2571 asm volatile("sha256rnds2 %xmm4, %xmm1"); 2572 asm volatile("sha256rnds2 %xmm7, %xmm2"); 2573 asm volatile("sha256rnds2 (%eax), %xmm1"); 2574 asm volatile("sha256rnds2 (0x12345678), %xmm1"); 2575 asm volatile("sha256rnds2 (%eax), %xmm3"); 2576 asm volatile("sha256rnds2 (%ecx,%eax,1), %xmm1"); 2577 asm volatile("sha256rnds2 0x12345678(,%eax,1), %xmm1"); 2578 asm volatile("sha256rnds2 (%eax,%ecx,1), %xmm1"); 2579 
asm volatile("sha256rnds2 (%eax,%ecx,8), %xmm1"); 2580 asm volatile("sha256rnds2 0x12(%eax), %xmm1"); 2581 asm volatile("sha256rnds2 0x12(%ebp), %xmm1"); 2582 asm volatile("sha256rnds2 0x12(%ecx,%eax,1), %xmm1"); 2583 asm volatile("sha256rnds2 0x12(%ebp,%eax,1), %xmm1"); 2584 asm volatile("sha256rnds2 0x12(%eax,%ecx,1), %xmm1"); 2585 asm volatile("sha256rnds2 0x12(%eax,%ecx,8), %xmm1"); 2586 asm volatile("sha256rnds2 0x12345678(%eax), %xmm1"); 2587 asm volatile("sha256rnds2 0x12345678(%ebp), %xmm1"); 2588 asm volatile("sha256rnds2 0x12345678(%ecx,%eax,1), %xmm1"); 2589 asm volatile("sha256rnds2 0x12345678(%ebp,%eax,1), %xmm1"); 2590 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,1), %xmm1"); 2591 asm volatile("sha256rnds2 0x12345678(%eax,%ecx,8), %xmm1"); 2592 2593 /* sha256msg1 xmm2/m128, xmm1 */ 2594 2595 asm volatile("sha256msg1 %xmm1, %xmm0"); 2596 asm volatile("sha256msg1 %xmm7, %xmm2"); 2597 asm volatile("sha256msg1 (%eax), %xmm0"); 2598 asm volatile("sha256msg1 (0x12345678), %xmm0"); 2599 asm volatile("sha256msg1 (%eax), %xmm3"); 2600 asm volatile("sha256msg1 (%ecx,%eax,1), %xmm0"); 2601 asm volatile("sha256msg1 0x12345678(,%eax,1), %xmm0"); 2602 asm volatile("sha256msg1 (%eax,%ecx,1), %xmm0"); 2603 asm volatile("sha256msg1 (%eax,%ecx,8), %xmm0"); 2604 asm volatile("sha256msg1 0x12(%eax), %xmm0"); 2605 asm volatile("sha256msg1 0x12(%ebp), %xmm0"); 2606 asm volatile("sha256msg1 0x12(%ecx,%eax,1), %xmm0"); 2607 asm volatile("sha256msg1 0x12(%ebp,%eax,1), %xmm0"); 2608 asm volatile("sha256msg1 0x12(%eax,%ecx,1), %xmm0"); 2609 asm volatile("sha256msg1 0x12(%eax,%ecx,8), %xmm0"); 2610 asm volatile("sha256msg1 0x12345678(%eax), %xmm0"); 2611 asm volatile("sha256msg1 0x12345678(%ebp), %xmm0"); 2612 asm volatile("sha256msg1 0x12345678(%ecx,%eax,1), %xmm0"); 2613 asm volatile("sha256msg1 0x12345678(%ebp,%eax,1), %xmm0"); 2614 asm volatile("sha256msg1 0x12345678(%eax,%ecx,1), %xmm0"); 2615 asm volatile("sha256msg1 0x12345678(%eax,%ecx,8), %xmm0"); 2616 2617 /* 
sha256msg2 xmm2/m128, xmm1 */ 2618 2619 asm volatile("sha256msg2 %xmm1, %xmm0"); 2620 asm volatile("sha256msg2 %xmm7, %xmm2"); 2621 asm volatile("sha256msg2 (%eax), %xmm0"); 2622 asm volatile("sha256msg2 (0x12345678), %xmm0"); 2623 asm volatile("sha256msg2 (%eax), %xmm3"); 2624 asm volatile("sha256msg2 (%ecx,%eax,1), %xmm0"); 2625 asm volatile("sha256msg2 0x12345678(,%eax,1), %xmm0"); 2626 asm volatile("sha256msg2 (%eax,%ecx,1), %xmm0"); 2627 asm volatile("sha256msg2 (%eax,%ecx,8), %xmm0"); 2628 asm volatile("sha256msg2 0x12(%eax), %xmm0"); 2629 asm volatile("sha256msg2 0x12(%ebp), %xmm0"); 2630 asm volatile("sha256msg2 0x12(%ecx,%eax,1), %xmm0"); 2631 asm volatile("sha256msg2 0x12(%ebp,%eax,1), %xmm0"); 2632 asm volatile("sha256msg2 0x12(%eax,%ecx,1), %xmm0"); 2633 asm volatile("sha256msg2 0x12(%eax,%ecx,8), %xmm0"); 2634 asm volatile("sha256msg2 0x12345678(%eax), %xmm0"); 2635 asm volatile("sha256msg2 0x12345678(%ebp), %xmm0"); 2636 asm volatile("sha256msg2 0x12345678(%ecx,%eax,1), %xmm0"); 2637 asm volatile("sha256msg2 0x12345678(%ebp,%eax,1), %xmm0"); 2638 asm volatile("sha256msg2 0x12345678(%eax,%ecx,1), %xmm0"); 2639 asm volatile("sha256msg2 0x12345678(%eax,%ecx,8), %xmm0"); 2640 2641 /* clflushopt m8 */ 2642 2643 asm volatile("clflushopt (%eax)"); 2644 asm volatile("clflushopt (0x12345678)"); 2645 asm volatile("clflushopt 0x12345678(%eax,%ecx,8)"); 2646 /* Also check instructions in the same group encoding as clflushopt */ 2647 asm volatile("clflush (%eax)"); 2648 asm volatile("sfence"); 2649 2650 /* clwb m8 */ 2651 2652 asm volatile("clwb (%eax)"); 2653 asm volatile("clwb (0x12345678)"); 2654 asm volatile("clwb 0x12345678(%eax,%ecx,8)"); 2655 /* Also check instructions in the same group encoding as clwb */ 2656 asm volatile("xsaveopt (%eax)"); 2657 asm volatile("mfence"); 2658 2659 /* xsavec mem */ 2660 2661 asm volatile("xsavec (%eax)"); 2662 asm volatile("xsavec (0x12345678)"); 2663 asm volatile("xsavec 0x12345678(%eax,%ecx,8)"); 2664 2665 /* xsaves mem 
*/ 2666 2667 asm volatile("xsaves (%eax)"); 2668 asm volatile("xsaves (0x12345678)"); 2669 asm volatile("xsaves 0x12345678(%eax,%ecx,8)"); 2670 2671 /* xrstors mem */ 2672 2673 asm volatile("xrstors (%eax)"); 2674 asm volatile("xrstors (0x12345678)"); 2675 asm volatile("xrstors 0x12345678(%eax,%ecx,8)"); 2676 2677 /* ptwrite */ 2678 2679 asm volatile("ptwrite (%eax)"); 2680 asm volatile("ptwrite (0x12345678)"); 2681 asm volatile("ptwrite 0x12345678(%eax,%ecx,8)"); 2682 2683 asm volatile("ptwritel (%eax)"); 2684 asm volatile("ptwritel (0x12345678)"); 2685 asm volatile("ptwritel 0x12345678(%eax,%ecx,8)"); 2686 2687 #endif /* #ifndef __x86_64__ */ 2688 2689 /* Following line is a marker for the awk script - do not change */ 2690 asm volatile("rdtsc"); /* Stop here */ 2691 2692 return 0; 2693 } 2694